Index: tests/lib/convert/utf84_test.dart |
diff --git a/tests/lib/convert/utf84_test.dart b/tests/lib/convert/utf84_test.dart |
index ddd1dc98448a4947e74318f4fab59dc3eaa69692..6a7d85cc3e8917a06c3519d449986268d826e2db 100755 |
--- a/tests/lib/convert/utf84_test.dart |
+++ b/tests/lib/convert/utf84_test.dart |
@@ -5,111 +5,620 @@ |
import 'package:expect/expect.dart'; |
import 'dart:convert'; |
-const String testEnglishPhrase = |
- "The quick brown fox jumps over the lazy dog."; |
- |
-const List<int> testEnglishUtf8 = const<int> [ |
- 0x54, 0x68, 0x65, 0x20, 0x71, 0x75, 0x69, 0x63, |
- 0x6b, 0x20, 0x62, 0x72, 0x6f, 0x77, 0x6e, 0x20, |
- 0x66, 0x6f, 0x78, 0x20, 0x6a, 0x75, 0x6d, 0x70, |
- 0x73, 0x20, 0x6f, 0x76, 0x65, 0x72, 0x20, 0x74, |
- 0x68, 0x65, 0x20, 0x6c, 0x61, 0x7a, 0x79, 0x20, |
- 0x64, 0x6f, 0x67, 0x2e]; |
+const String testEnglishPhrase = "The quick brown fox jumps over the lazy dog."; |
+ |
+const List<int> testEnglishUtf8 = const <int>[ |
+ 0x54, |
+ 0x68, |
+ 0x65, |
+ 0x20, |
+ 0x71, |
+ 0x75, |
+ 0x69, |
+ 0x63, |
+ 0x6b, |
+ 0x20, |
+ 0x62, |
+ 0x72, |
+ 0x6f, |
+ 0x77, |
+ 0x6e, |
+ 0x20, |
+ 0x66, |
+ 0x6f, |
+ 0x78, |
+ 0x20, |
+ 0x6a, |
+ 0x75, |
+ 0x6d, |
+ 0x70, |
+ 0x73, |
+ 0x20, |
+ 0x6f, |
+ 0x76, |
+ 0x65, |
+ 0x72, |
+ 0x20, |
+ 0x74, |
+ 0x68, |
+ 0x65, |
+ 0x20, |
+ 0x6c, |
+ 0x61, |
+ 0x7a, |
+ 0x79, |
+ 0x20, |
+ 0x64, |
+ 0x6f, |
+ 0x67, |
+ 0x2e |
+]; |
const String testDanishPhrase = "Quizdeltagerne spiste jordbær med " |
"fløde mens cirkusklovnen Wolther spillede på xylofon."; |
-const List<int> testDanishUtf8 = const<int>[ |
- 0x51, 0x75, 0x69, 0x7a, 0x64, 0x65, 0x6c, 0x74, |
- 0x61, 0x67, 0x65, 0x72, 0x6e, 0x65, 0x20, 0x73, |
- 0x70, 0x69, 0x73, 0x74, 0x65, 0x20, 0x6a, 0x6f, |
- 0x72, 0x64, 0x62, 0xc3, 0xa6, 0x72, 0x20, 0x6d, |
- 0x65, 0x64, 0x20, 0x66, 0x6c, 0xc3, 0xb8, 0x64, |
- 0x65, 0x20, 0x6d, 0x65, 0x6e, 0x73, 0x20, 0x63, |
- 0x69, 0x72, 0x6b, 0x75, 0x73, 0x6b, 0x6c, 0x6f, |
- 0x76, 0x6e, 0x65, 0x6e, 0x20, 0x57, 0x6f, 0x6c, |
- 0x74, 0x68, 0x65, 0x72, 0x20, 0x73, 0x70, 0x69, |
- 0x6c, 0x6c, 0x65, 0x64, 0x65, 0x20, 0x70, 0xc3, |
- 0xa5, 0x20, 0x78, 0x79, 0x6c, 0x6f, 0x66, 0x6f, |
- 0x6e, 0x2e]; |
+const List<int> testDanishUtf8 = const <int>[ |
+ 0x51, |
+ 0x75, |
+ 0x69, |
+ 0x7a, |
+ 0x64, |
+ 0x65, |
+ 0x6c, |
+ 0x74, |
+ 0x61, |
+ 0x67, |
+ 0x65, |
+ 0x72, |
+ 0x6e, |
+ 0x65, |
+ 0x20, |
+ 0x73, |
+ 0x70, |
+ 0x69, |
+ 0x73, |
+ 0x74, |
+ 0x65, |
+ 0x20, |
+ 0x6a, |
+ 0x6f, |
+ 0x72, |
+ 0x64, |
+ 0x62, |
+ 0xc3, |
+ 0xa6, |
+ 0x72, |
+ 0x20, |
+ 0x6d, |
+ 0x65, |
+ 0x64, |
+ 0x20, |
+ 0x66, |
+ 0x6c, |
+ 0xc3, |
+ 0xb8, |
+ 0x64, |
+ 0x65, |
+ 0x20, |
+ 0x6d, |
+ 0x65, |
+ 0x6e, |
+ 0x73, |
+ 0x20, |
+ 0x63, |
+ 0x69, |
+ 0x72, |
+ 0x6b, |
+ 0x75, |
+ 0x73, |
+ 0x6b, |
+ 0x6c, |
+ 0x6f, |
+ 0x76, |
+ 0x6e, |
+ 0x65, |
+ 0x6e, |
+ 0x20, |
+ 0x57, |
+ 0x6f, |
+ 0x6c, |
+ 0x74, |
+ 0x68, |
+ 0x65, |
+ 0x72, |
+ 0x20, |
+ 0x73, |
+ 0x70, |
+ 0x69, |
+ 0x6c, |
+ 0x6c, |
+ 0x65, |
+ 0x64, |
+ 0x65, |
+ 0x20, |
+ 0x70, |
+ 0xc3, |
+ 0xa5, |
+ 0x20, |
+ 0x78, |
+ 0x79, |
+ 0x6c, |
+ 0x6f, |
+ 0x66, |
+ 0x6f, |
+ 0x6e, |
+ 0x2e |
+]; |
// unusual formatting due to strange editor interaction w/ text direction. |
-const String |
- testHebrewPhrase = "דג סקרן שט בים מאוכזב ולפתע מצא לו חברה איך הקליטה"; |
- |
-const List<int> testHebrewUtf8 = const<int>[ |
- 0xd7, 0x93, 0xd7, 0x92, 0x20, 0xd7, 0xa1, 0xd7, |
- 0xa7, 0xd7, 0xa8, 0xd7, 0x9f, 0x20, 0xd7, 0xa9, |
- 0xd7, 0x98, 0x20, 0xd7, 0x91, 0xd7, 0x99, 0xd7, |
- 0x9d, 0x20, 0xd7, 0x9e, 0xd7, 0x90, 0xd7, 0x95, |
- 0xd7, 0x9b, 0xd7, 0x96, 0xd7, 0x91, 0x20, 0xd7, |
- 0x95, 0xd7, 0x9c, 0xd7, 0xa4, 0xd7, 0xaa, 0xd7, |
- 0xa2, 0x20, 0xd7, 0x9e, 0xd7, 0xa6, 0xd7, 0x90, |
- 0x20, 0xd7, 0x9c, 0xd7, 0x95, 0x20, 0xd7, 0x97, |
- 0xd7, 0x91, 0xd7, 0xa8, 0xd7, 0x94, 0x20, 0xd7, |
- 0x90, 0xd7, 0x99, 0xd7, 0x9a, 0x20, 0xd7, 0x94, |
- 0xd7, 0xa7, 0xd7, 0x9c, 0xd7, 0x99, 0xd7, 0x98, |
- 0xd7, 0x94]; |
+const String testHebrewPhrase = |
+ "דג סקרן שט בים מאוכזב ולפתע מצא לו חברה איך הקליטה"; |
+ |
+const List<int> testHebrewUtf8 = const <int>[ |
+ 0xd7, |
+ 0x93, |
+ 0xd7, |
+ 0x92, |
+ 0x20, |
+ 0xd7, |
+ 0xa1, |
+ 0xd7, |
+ 0xa7, |
+ 0xd7, |
+ 0xa8, |
+ 0xd7, |
+ 0x9f, |
+ 0x20, |
+ 0xd7, |
+ 0xa9, |
+ 0xd7, |
+ 0x98, |
+ 0x20, |
+ 0xd7, |
+ 0x91, |
+ 0xd7, |
+ 0x99, |
+ 0xd7, |
+ 0x9d, |
+ 0x20, |
+ 0xd7, |
+ 0x9e, |
+ 0xd7, |
+ 0x90, |
+ 0xd7, |
+ 0x95, |
+ 0xd7, |
+ 0x9b, |
+ 0xd7, |
+ 0x96, |
+ 0xd7, |
+ 0x91, |
+ 0x20, |
+ 0xd7, |
+ 0x95, |
+ 0xd7, |
+ 0x9c, |
+ 0xd7, |
+ 0xa4, |
+ 0xd7, |
+ 0xaa, |
+ 0xd7, |
+ 0xa2, |
+ 0x20, |
+ 0xd7, |
+ 0x9e, |
+ 0xd7, |
+ 0xa6, |
+ 0xd7, |
+ 0x90, |
+ 0x20, |
+ 0xd7, |
+ 0x9c, |
+ 0xd7, |
+ 0x95, |
+ 0x20, |
+ 0xd7, |
+ 0x97, |
+ 0xd7, |
+ 0x91, |
+ 0xd7, |
+ 0xa8, |
+ 0xd7, |
+ 0x94, |
+ 0x20, |
+ 0xd7, |
+ 0x90, |
+ 0xd7, |
+ 0x99, |
+ 0xd7, |
+ 0x9a, |
+ 0x20, |
+ 0xd7, |
+ 0x94, |
+ 0xd7, |
+ 0xa7, |
+ 0xd7, |
+ 0x9c, |
+ 0xd7, |
+ 0x99, |
+ 0xd7, |
+ 0x98, |
+ 0xd7, |
+ 0x94 |
+]; |
const String testRussianPhrase = "Съешь же ещё этих мягких " |
"французских булок да выпей чаю"; |
-const List<int> testRussianUtf8 = const<int>[ |
- 0xd0, 0xa1, 0xd1, 0x8a, 0xd0, 0xb5, 0xd1, 0x88, |
- 0xd1, 0x8c, 0x20, 0xd0, 0xb6, 0xd0, 0xb5, 0x20, |
- 0xd0, 0xb5, 0xd1, 0x89, 0xd1, 0x91, 0x20, 0xd1, |
- 0x8d, 0xd1, 0x82, 0xd0, 0xb8, 0xd1, 0x85, 0x20, |
- 0xd0, 0xbc, 0xd1, 0x8f, 0xd0, 0xb3, 0xd0, 0xba, |
- 0xd0, 0xb8, 0xd1, 0x85, 0x20, 0xd1, 0x84, 0xd1, |
- 0x80, 0xd0, 0xb0, 0xd0, 0xbd, 0xd1, 0x86, 0xd1, |
- 0x83, 0xd0, 0xb7, 0xd1, 0x81, 0xd0, 0xba, 0xd0, |
- 0xb8, 0xd1, 0x85, 0x20, 0xd0, 0xb1, 0xd1, 0x83, |
- 0xd0, 0xbb, 0xd0, 0xbe, 0xd0, 0xba, 0x20, 0xd0, |
- 0xb4, 0xd0, 0xb0, 0x20, 0xd0, 0xb2, 0xd1, 0x8b, |
- 0xd0, 0xbf, 0xd0, 0xb5, 0xd0, 0xb9, 0x20, 0xd1, |
- 0x87, 0xd0, 0xb0, 0xd1, 0x8e]; |
+const List<int> testRussianUtf8 = const <int>[ |
+ 0xd0, |
+ 0xa1, |
+ 0xd1, |
+ 0x8a, |
+ 0xd0, |
+ 0xb5, |
+ 0xd1, |
+ 0x88, |
+ 0xd1, |
+ 0x8c, |
+ 0x20, |
+ 0xd0, |
+ 0xb6, |
+ 0xd0, |
+ 0xb5, |
+ 0x20, |
+ 0xd0, |
+ 0xb5, |
+ 0xd1, |
+ 0x89, |
+ 0xd1, |
+ 0x91, |
+ 0x20, |
+ 0xd1, |
+ 0x8d, |
+ 0xd1, |
+ 0x82, |
+ 0xd0, |
+ 0xb8, |
+ 0xd1, |
+ 0x85, |
+ 0x20, |
+ 0xd0, |
+ 0xbc, |
+ 0xd1, |
+ 0x8f, |
+ 0xd0, |
+ 0xb3, |
+ 0xd0, |
+ 0xba, |
+ 0xd0, |
+ 0xb8, |
+ 0xd1, |
+ 0x85, |
+ 0x20, |
+ 0xd1, |
+ 0x84, |
+ 0xd1, |
+ 0x80, |
+ 0xd0, |
+ 0xb0, |
+ 0xd0, |
+ 0xbd, |
+ 0xd1, |
+ 0x86, |
+ 0xd1, |
+ 0x83, |
+ 0xd0, |
+ 0xb7, |
+ 0xd1, |
+ 0x81, |
+ 0xd0, |
+ 0xba, |
+ 0xd0, |
+ 0xb8, |
+ 0xd1, |
+ 0x85, |
+ 0x20, |
+ 0xd0, |
+ 0xb1, |
+ 0xd1, |
+ 0x83, |
+ 0xd0, |
+ 0xbb, |
+ 0xd0, |
+ 0xbe, |
+ 0xd0, |
+ 0xba, |
+ 0x20, |
+ 0xd0, |
+ 0xb4, |
+ 0xd0, |
+ 0xb0, |
+ 0x20, |
+ 0xd0, |
+ 0xb2, |
+ 0xd1, |
+ 0x8b, |
+ 0xd0, |
+ 0xbf, |
+ 0xd0, |
+ 0xb5, |
+ 0xd0, |
+ 0xb9, |
+ 0x20, |
+ 0xd1, |
+ 0x87, |
+ 0xd0, |
+ 0xb0, |
+ 0xd1, |
+ 0x8e |
+]; |
const String testGreekPhrase = "Γαζέες καὶ μυρτιὲς δὲν θὰ βρῶ πιὰ " |
"στὸ χρυσαφὶ ξέφωτο"; |
-const List<int> testGreekUtf8 = const<int>[ |
- 0xce, 0x93, 0xce, 0xb1, 0xce, 0xb6, 0xce, 0xad, |
- 0xce, 0xb5, 0xcf, 0x82, 0x20, 0xce, 0xba, 0xce, |
- 0xb1, 0xe1, 0xbd, 0xb6, 0x20, 0xce, 0xbc, 0xcf, |
- 0x85, 0xcf, 0x81, 0xcf, 0x84, 0xce, 0xb9, 0xe1, |
- 0xbd, 0xb2, 0xcf, 0x82, 0x20, 0xce, 0xb4, 0xe1, |
- 0xbd, 0xb2, 0xce, 0xbd, 0x20, 0xce, 0xb8, 0xe1, |
- 0xbd, 0xb0, 0x20, 0xce, 0xb2, 0xcf, 0x81, 0xe1, |
- 0xbf, 0xb6, 0x20, 0xcf, 0x80, 0xce, 0xb9, 0xe1, |
- 0xbd, 0xb0, 0x20, 0xcf, 0x83, 0xcf, 0x84, 0xe1, |
- 0xbd, 0xb8, 0x20, 0xcf, 0x87, 0xcf, 0x81, 0xcf, |
- 0x85, 0xcf, 0x83, 0xce, 0xb1, 0xcf, 0x86, 0xe1, |
- 0xbd, 0xb6, 0x20, 0xce, 0xbe, 0xce, 0xad, 0xcf, |
- 0x86, 0xcf, 0x89, 0xcf, 0x84, 0xce, 0xbf]; |
+const List<int> testGreekUtf8 = const <int>[ |
+ 0xce, |
+ 0x93, |
+ 0xce, |
+ 0xb1, |
+ 0xce, |
+ 0xb6, |
+ 0xce, |
+ 0xad, |
+ 0xce, |
+ 0xb5, |
+ 0xcf, |
+ 0x82, |
+ 0x20, |
+ 0xce, |
+ 0xba, |
+ 0xce, |
+ 0xb1, |
+ 0xe1, |
+ 0xbd, |
+ 0xb6, |
+ 0x20, |
+ 0xce, |
+ 0xbc, |
+ 0xcf, |
+ 0x85, |
+ 0xcf, |
+ 0x81, |
+ 0xcf, |
+ 0x84, |
+ 0xce, |
+ 0xb9, |
+ 0xe1, |
+ 0xbd, |
+ 0xb2, |
+ 0xcf, |
+ 0x82, |
+ 0x20, |
+ 0xce, |
+ 0xb4, |
+ 0xe1, |
+ 0xbd, |
+ 0xb2, |
+ 0xce, |
+ 0xbd, |
+ 0x20, |
+ 0xce, |
+ 0xb8, |
+ 0xe1, |
+ 0xbd, |
+ 0xb0, |
+ 0x20, |
+ 0xce, |
+ 0xb2, |
+ 0xcf, |
+ 0x81, |
+ 0xe1, |
+ 0xbf, |
+ 0xb6, |
+ 0x20, |
+ 0xcf, |
+ 0x80, |
+ 0xce, |
+ 0xb9, |
+ 0xe1, |
+ 0xbd, |
+ 0xb0, |
+ 0x20, |
+ 0xcf, |
+ 0x83, |
+ 0xcf, |
+ 0x84, |
+ 0xe1, |
+ 0xbd, |
+ 0xb8, |
+ 0x20, |
+ 0xcf, |
+ 0x87, |
+ 0xcf, |
+ 0x81, |
+ 0xcf, |
+ 0x85, |
+ 0xcf, |
+ 0x83, |
+ 0xce, |
+ 0xb1, |
+ 0xcf, |
+ 0x86, |
+ 0xe1, |
+ 0xbd, |
+ 0xb6, |
+ 0x20, |
+ 0xce, |
+ 0xbe, |
+ 0xce, |
+ 0xad, |
+ 0xcf, |
+ 0x86, |
+ 0xcf, |
+ 0x89, |
+ 0xcf, |
+ 0x84, |
+ 0xce, |
+ 0xbf |
+]; |
const String testKatakanaPhrase = "イロハニホヘト チリヌルヲ ワカヨタレソ " |
"ツネナラム ウヰノオクヤマ ケフコエテ アサキユメミシ ヱヒモセスン"; |
-const List<int> testKatakanaUtf8 = const<int>[ |
- 0xe3, 0x82, 0xa4, 0xe3, 0x83, 0xad, 0xe3, 0x83, |
- 0x8f, 0xe3, 0x83, 0x8b, 0xe3, 0x83, 0x9b, 0xe3, |
- 0x83, 0x98, 0xe3, 0x83, 0x88, 0x20, 0xe3, 0x83, |
- 0x81, 0xe3, 0x83, 0xaa, 0xe3, 0x83, 0x8c, 0xe3, |
- 0x83, 0xab, 0xe3, 0x83, 0xb2, 0x20, 0xe3, 0x83, |
- 0xaf, 0xe3, 0x82, 0xab, 0xe3, 0x83, 0xa8, 0xe3, |
- 0x82, 0xbf, 0xe3, 0x83, 0xac, 0xe3, 0x82, 0xbd, |
- 0x20, 0xe3, 0x83, 0x84, 0xe3, 0x83, 0x8d, 0xe3, |
- 0x83, 0x8a, 0xe3, 0x83, 0xa9, 0xe3, 0x83, 0xa0, |
- 0x20, 0xe3, 0x82, 0xa6, 0xe3, 0x83, 0xb0, 0xe3, |
- 0x83, 0x8e, 0xe3, 0x82, 0xaa, 0xe3, 0x82, 0xaf, |
- 0xe3, 0x83, 0xa4, 0xe3, 0x83, 0x9e, 0x20, 0xe3, |
- 0x82, 0xb1, 0xe3, 0x83, 0x95, 0xe3, 0x82, 0xb3, |
- 0xe3, 0x82, 0xa8, 0xe3, 0x83, 0x86, 0x20, 0xe3, |
- 0x82, 0xa2, 0xe3, 0x82, 0xb5, 0xe3, 0x82, 0xad, |
- 0xe3, 0x83, 0xa6, 0xe3, 0x83, 0xa1, 0xe3, 0x83, |
- 0x9f, 0xe3, 0x82, 0xb7, 0x20, 0xe3, 0x83, 0xb1, |
- 0xe3, 0x83, 0x92, 0xe3, 0x83, 0xa2, 0xe3, 0x82, |
- 0xbb, 0xe3, 0x82, 0xb9, 0xe3, 0x83, 0xb3]; |
+const List<int> testKatakanaUtf8 = const <int>[ |
+ 0xe3, |
+ 0x82, |
+ 0xa4, |
+ 0xe3, |
+ 0x83, |
+ 0xad, |
+ 0xe3, |
+ 0x83, |
+ 0x8f, |
+ 0xe3, |
+ 0x83, |
+ 0x8b, |
+ 0xe3, |
+ 0x83, |
+ 0x9b, |
+ 0xe3, |
+ 0x83, |
+ 0x98, |
+ 0xe3, |
+ 0x83, |
+ 0x88, |
+ 0x20, |
+ 0xe3, |
+ 0x83, |
+ 0x81, |
+ 0xe3, |
+ 0x83, |
+ 0xaa, |
+ 0xe3, |
+ 0x83, |
+ 0x8c, |
+ 0xe3, |
+ 0x83, |
+ 0xab, |
+ 0xe3, |
+ 0x83, |
+ 0xb2, |
+ 0x20, |
+ 0xe3, |
+ 0x83, |
+ 0xaf, |
+ 0xe3, |
+ 0x82, |
+ 0xab, |
+ 0xe3, |
+ 0x83, |
+ 0xa8, |
+ 0xe3, |
+ 0x82, |
+ 0xbf, |
+ 0xe3, |
+ 0x83, |
+ 0xac, |
+ 0xe3, |
+ 0x82, |
+ 0xbd, |
+ 0x20, |
+ 0xe3, |
+ 0x83, |
+ 0x84, |
+ 0xe3, |
+ 0x83, |
+ 0x8d, |
+ 0xe3, |
+ 0x83, |
+ 0x8a, |
+ 0xe3, |
+ 0x83, |
+ 0xa9, |
+ 0xe3, |
+ 0x83, |
+ 0xa0, |
+ 0x20, |
+ 0xe3, |
+ 0x82, |
+ 0xa6, |
+ 0xe3, |
+ 0x83, |
+ 0xb0, |
+ 0xe3, |
+ 0x83, |
+ 0x8e, |
+ 0xe3, |
+ 0x82, |
+ 0xaa, |
+ 0xe3, |
+ 0x82, |
+ 0xaf, |
+ 0xe3, |
+ 0x83, |
+ 0xa4, |
+ 0xe3, |
+ 0x83, |
+ 0x9e, |
+ 0x20, |
+ 0xe3, |
+ 0x82, |
+ 0xb1, |
+ 0xe3, |
+ 0x83, |
+ 0x95, |
+ 0xe3, |
+ 0x82, |
+ 0xb3, |
+ 0xe3, |
+ 0x82, |
+ 0xa8, |
+ 0xe3, |
+ 0x83, |
+ 0x86, |
+ 0x20, |
+ 0xe3, |
+ 0x82, |
+ 0xa2, |
+ 0xe3, |
+ 0x82, |
+ 0xb5, |
+ 0xe3, |
+ 0x82, |
+ 0xad, |
+ 0xe3, |
+ 0x83, |
+ 0xa6, |
+ 0xe3, |
+ 0x83, |
+ 0xa1, |
+ 0xe3, |
+ 0x83, |
+ 0x9f, |
+ 0xe3, |
+ 0x82, |
+ 0xb7, |
+ 0x20, |
+ 0xe3, |
+ 0x83, |
+ 0xb1, |
+ 0xe3, |
+ 0x83, |
+ 0x92, |
+ 0xe3, |
+ 0x83, |
+ 0xa2, |
+ 0xe3, |
+ 0x82, |
+ 0xbb, |
+ 0xe3, |
+ 0x82, |
+ 0xb9, |
+ 0xe3, |
+ 0x83, |
+ 0xb3 |
+]; |
void main() { |
testUtf8bytesToCodepoints(); |
@@ -121,91 +630,98 @@ List<int> encodeUtf8(String str) => UTF8.encode(str); |
List<int> utf8ToRunes(List<int> codeUnits) { |
return UTF8.decode(codeUnits, allowMalformed: true).runes.toList(); |
} |
+ |
String decodeUtf8(List<int> codeUnits) => UTF8.decode(codeUnits); |
void testEncodeToUtf8() { |
- Expect.listEquals(testEnglishUtf8, encodeUtf8(testEnglishPhrase), |
- "english to utf8"); |
+ Expect.listEquals( |
+ testEnglishUtf8, encodeUtf8(testEnglishPhrase), "english to utf8"); |
- Expect.listEquals(testDanishUtf8, encodeUtf8(testDanishPhrase), |
- "encode danish to utf8"); |
+ Expect.listEquals( |
+ testDanishUtf8, encodeUtf8(testDanishPhrase), "encode danish to utf8"); |
- Expect.listEquals(testHebrewUtf8, encodeUtf8(testHebrewPhrase), |
- "Hebrew to utf8"); |
+ Expect.listEquals( |
+ testHebrewUtf8, encodeUtf8(testHebrewPhrase), "Hebrew to utf8"); |
- Expect.listEquals(testRussianUtf8, encodeUtf8(testRussianPhrase), |
- "Russian to utf8"); |
+ Expect.listEquals( |
+ testRussianUtf8, encodeUtf8(testRussianPhrase), "Russian to utf8"); |
- Expect.listEquals(testGreekUtf8, encodeUtf8(testGreekPhrase), |
- "Greek to utf8"); |
+ Expect.listEquals( |
+ testGreekUtf8, encodeUtf8(testGreekPhrase), "Greek to utf8"); |
- Expect.listEquals(testKatakanaUtf8, encodeUtf8(testKatakanaPhrase), |
- "Katakana to utf8"); |
+ Expect.listEquals( |
+ testKatakanaUtf8, encodeUtf8(testKatakanaPhrase), "Katakana to utf8"); |
} |
void testUtf8bytesToCodepoints() { |
- Expect.listEquals([954, 972, 963, 956, 949], |
- utf8ToRunes([0xce, 0xba, 0xcf, 0x8c, 0xcf, |
- 0x83, 0xce, 0xbc, 0xce, 0xb5]), "κόσμε"); |
+ Expect.listEquals( |
+ [954, 972, 963, 956, 949], |
+ utf8ToRunes([0xce, 0xba, 0xcf, 0x8c, 0xcf, 0x83, 0xce, 0xbc, 0xce, 0xb5]), |
+ "κόσμε"); |
// boundary conditions: First possible sequence of a certain length |
Expect.listEquals([], utf8ToRunes([]), "no input"); |
Expect.listEquals([0x0], utf8ToRunes([0x0]), "0"); |
Expect.listEquals([0x80], utf8ToRunes([0xc2, 0x80]), "80"); |
- Expect.listEquals([0x800], |
- utf8ToRunes([0xe0, 0xa0, 0x80]), "800"); |
- Expect.listEquals([0x10000], |
- utf8ToRunes([0xf0, 0x90, 0x80, 0x80]), "10000"); |
- Expect.listEquals( |
- [UNICODE_REPLACEMENT_CHARACTER_RUNE, UNICODE_REPLACEMENT_CHARACTER_RUNE, |
- UNICODE_REPLACEMENT_CHARACTER_RUNE, UNICODE_REPLACEMENT_CHARACTER_RUNE, |
- UNICODE_REPLACEMENT_CHARACTER_RUNE], |
- utf8ToRunes([0xf8, 0x88, 0x80, 0x80, 0x80]), "200000"); |
- Expect.listEquals( |
- [UNICODE_REPLACEMENT_CHARACTER_RUNE, UNICODE_REPLACEMENT_CHARACTER_RUNE, |
- UNICODE_REPLACEMENT_CHARACTER_RUNE, UNICODE_REPLACEMENT_CHARACTER_RUNE, |
- UNICODE_REPLACEMENT_CHARACTER_RUNE, UNICODE_REPLACEMENT_CHARACTER_RUNE], |
- utf8ToRunes([0xfc, 0x84, 0x80, 0x80, 0x80, 0x80]), |
- "4000000"); |
+ Expect.listEquals([0x800], utf8ToRunes([0xe0, 0xa0, 0x80]), "800"); |
+ Expect.listEquals([0x10000], utf8ToRunes([0xf0, 0x90, 0x80, 0x80]), "10000"); |
+ Expect.listEquals([ |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE |
+ ], utf8ToRunes([0xf8, 0x88, 0x80, 0x80, 0x80]), "200000"); |
+ Expect.listEquals([ |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE |
+ ], utf8ToRunes([0xfc, 0x84, 0x80, 0x80, 0x80, 0x80]), "4000000"); |
// boundary conditions: Last possible sequence of a certain length |
Expect.listEquals([0x7f], utf8ToRunes([0x7f]), "7f"); |
Expect.listEquals([0x7ff], utf8ToRunes([0xdf, 0xbf]), "7ff"); |
- Expect.listEquals([0xffff], |
- utf8ToRunes([0xef, 0xbf, 0xbf]), "ffff"); |
- Expect.listEquals( |
- [UNICODE_REPLACEMENT_CHARACTER_RUNE, UNICODE_REPLACEMENT_CHARACTER_RUNE, |
- UNICODE_REPLACEMENT_CHARACTER_RUNE, UNICODE_REPLACEMENT_CHARACTER_RUNE], |
- utf8ToRunes([0xf7, 0xbf, 0xbf, 0xbf]), "1fffff"); |
- Expect.listEquals( |
- [UNICODE_REPLACEMENT_CHARACTER_RUNE, UNICODE_REPLACEMENT_CHARACTER_RUNE, |
- UNICODE_REPLACEMENT_CHARACTER_RUNE, UNICODE_REPLACEMENT_CHARACTER_RUNE, |
- UNICODE_REPLACEMENT_CHARACTER_RUNE], |
- utf8ToRunes([0xfb, 0xbf, 0xbf, 0xbf, 0xbf]), "3ffffff"); |
- Expect.listEquals( |
- [UNICODE_REPLACEMENT_CHARACTER_RUNE, UNICODE_REPLACEMENT_CHARACTER_RUNE, |
- UNICODE_REPLACEMENT_CHARACTER_RUNE, UNICODE_REPLACEMENT_CHARACTER_RUNE, |
- UNICODE_REPLACEMENT_CHARACTER_RUNE, UNICODE_REPLACEMENT_CHARACTER_RUNE], |
- utf8ToRunes([0xfd, 0xbf, 0xbf, 0xbf, 0xbf, 0xbf]), |
- "4000000"); |
+ Expect.listEquals([0xffff], utf8ToRunes([0xef, 0xbf, 0xbf]), "ffff"); |
+ Expect.listEquals([ |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE |
+ ], utf8ToRunes([0xf7, 0xbf, 0xbf, 0xbf]), "1fffff"); |
+ Expect.listEquals([ |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE |
+ ], utf8ToRunes([0xfb, 0xbf, 0xbf, 0xbf, 0xbf]), "3ffffff"); |
+ Expect.listEquals([ |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE |
+ ], utf8ToRunes([0xfd, 0xbf, 0xbf, 0xbf, 0xbf, 0xbf]), "4000000"); |
// other boundary conditions |
- Expect.listEquals([0xd7ff], |
- utf8ToRunes([0xed, 0x9f, 0xbf]), "d7ff"); |
- Expect.listEquals([0xe000], |
- utf8ToRunes([0xee, 0x80, 0x80]), "e000"); |
+ Expect.listEquals([0xd7ff], utf8ToRunes([0xed, 0x9f, 0xbf]), "d7ff"); |
+ Expect.listEquals([0xe000], utf8ToRunes([0xee, 0x80, 0x80]), "e000"); |
Expect.listEquals([UNICODE_REPLACEMENT_CHARACTER_RUNE], |
utf8ToRunes([0xef, 0xbf, 0xbd]), "fffd"); |
- Expect.listEquals([0x10ffff], |
- utf8ToRunes([0xf4, 0x8f, 0xbf, 0xbf]), "10ffff"); |
+ Expect |
+ .listEquals([0x10ffff], utf8ToRunes([0xf4, 0x8f, 0xbf, 0xbf]), "10ffff"); |
Expect.listEquals([UNICODE_REPLACEMENT_CHARACTER_RUNE], |
utf8ToRunes([0xf4, 0x90, 0x80, 0x80]), "110000"); |
// unexpected continuation bytes |
- Expect.listEquals([UNICODE_REPLACEMENT_CHARACTER_RUNE], |
- utf8ToRunes([0x80]), "80 => replacement character"); |
- Expect.listEquals([UNICODE_REPLACEMENT_CHARACTER_RUNE], |
- utf8ToRunes([0xbf]), "bf => replacement character"); |
+ Expect.listEquals([UNICODE_REPLACEMENT_CHARACTER_RUNE], utf8ToRunes([0x80]), |
+ "80 => replacement character"); |
+ Expect.listEquals([UNICODE_REPLACEMENT_CHARACTER_RUNE], utf8ToRunes([0xbf]), |
+ "bf => replacement character"); |
List<int> allContinuationBytes = <int>[]; |
List<int> matchingReplacementChars = <int>[]; |
@@ -213,228 +729,266 @@ void testUtf8bytesToCodepoints() { |
allContinuationBytes.add(i); |
matchingReplacementChars.add(UNICODE_REPLACEMENT_CHARACTER_RUNE); |
} |
- Expect.listEquals(matchingReplacementChars, |
- utf8ToRunes(allContinuationBytes), |
+ Expect.listEquals(matchingReplacementChars, utf8ToRunes(allContinuationBytes), |
"80 - bf => replacement character x 64"); |
List<int> allFirstTwoByteSeq = <int>[]; |
matchingReplacementChars = <int>[]; |
for (int i = 0xc0; i < 0xe0; i++) { |
allFirstTwoByteSeq.addAll([i, 0x20]); |
- matchingReplacementChars.addAll( |
- [UNICODE_REPLACEMENT_CHARACTER_RUNE, 0x20]); |
+ matchingReplacementChars.addAll([UNICODE_REPLACEMENT_CHARACTER_RUNE, 0x20]); |
} |
- Expect.listEquals(matchingReplacementChars, |
- utf8ToRunes(allFirstTwoByteSeq), |
+ Expect.listEquals(matchingReplacementChars, utf8ToRunes(allFirstTwoByteSeq), |
"c0 - df + space => replacement character + space x 32"); |
List<int> allFirstThreeByteSeq = <int>[]; |
matchingReplacementChars = <int>[]; |
for (int i = 0xe0; i < 0xf0; i++) { |
allFirstThreeByteSeq.addAll([i, 0x20]); |
- matchingReplacementChars.addAll( |
- [UNICODE_REPLACEMENT_CHARACTER_RUNE, 0x20]); |
+ matchingReplacementChars.addAll([UNICODE_REPLACEMENT_CHARACTER_RUNE, 0x20]); |
} |
- Expect.listEquals(matchingReplacementChars, |
- utf8ToRunes(allFirstThreeByteSeq), |
+ Expect.listEquals(matchingReplacementChars, utf8ToRunes(allFirstThreeByteSeq), |
"e0 - ef + space => replacement character x 16"); |
List<int> allFirstFourByteSeq = <int>[]; |
matchingReplacementChars = <int>[]; |
for (int i = 0xf0; i < 0xf8; i++) { |
allFirstFourByteSeq.addAll([i, 0x20]); |
- matchingReplacementChars.addAll( |
- [UNICODE_REPLACEMENT_CHARACTER_RUNE, 0x20]); |
+ matchingReplacementChars.addAll([UNICODE_REPLACEMENT_CHARACTER_RUNE, 0x20]); |
} |
- Expect.listEquals(matchingReplacementChars, |
- utf8ToRunes(allFirstFourByteSeq), |
+ Expect.listEquals(matchingReplacementChars, utf8ToRunes(allFirstFourByteSeq), |
"f0 - f7 + space => replacement character x 8"); |
List<int> allFirstFiveByteSeq = <int>[]; |
matchingReplacementChars = <int>[]; |
for (int i = 0xf8; i < 0xfc; i++) { |
allFirstFiveByteSeq.addAll([i, 0x20]); |
- matchingReplacementChars.addAll( |
- [UNICODE_REPLACEMENT_CHARACTER_RUNE, 0x20]); |
+ matchingReplacementChars.addAll([UNICODE_REPLACEMENT_CHARACTER_RUNE, 0x20]); |
} |
- Expect.listEquals(matchingReplacementChars, |
- utf8ToRunes(allFirstFiveByteSeq), |
+ Expect.listEquals(matchingReplacementChars, utf8ToRunes(allFirstFiveByteSeq), |
"f8 - fb + space => replacement character x 4"); |
List<int> allFirstSixByteSeq = <int>[]; |
matchingReplacementChars = <int>[]; |
for (int i = 0xfc; i < 0xfe; i++) { |
allFirstSixByteSeq.addAll([i, 0x20]); |
- matchingReplacementChars.addAll( |
- [UNICODE_REPLACEMENT_CHARACTER_RUNE, 0x20]); |
+ matchingReplacementChars.addAll([UNICODE_REPLACEMENT_CHARACTER_RUNE, 0x20]); |
} |
- Expect.listEquals(matchingReplacementChars, |
- utf8ToRunes(allFirstSixByteSeq), |
+ Expect.listEquals(matchingReplacementChars, utf8ToRunes(allFirstSixByteSeq), |
"fc - fd + space => replacement character x 2"); |
// Sequences with last continuation byte missing |
- Expect.listEquals([UNICODE_REPLACEMENT_CHARACTER_RUNE], |
- utf8ToRunes([0xc2]), |
+ Expect.listEquals([UNICODE_REPLACEMENT_CHARACTER_RUNE], utf8ToRunes([0xc2]), |
"2-byte sequence with last byte missing"); |
Expect.listEquals([UNICODE_REPLACEMENT_CHARACTER_RUNE], |
- utf8ToRunes([0xe0, 0x80]), |
- "3-byte sequence with last byte missing"); |
- Expect.listEquals([UNICODE_REPLACEMENT_CHARACTER_RUNE], |
+ utf8ToRunes([0xe0, 0x80]), "3-byte sequence with last byte missing"); |
+ Expect.listEquals( |
+ [UNICODE_REPLACEMENT_CHARACTER_RUNE], |
utf8ToRunes([0xf0, 0x80, 0x80]), |
"4-byte sequence with last byte missing"); |
- Expect.listEquals( |
- [UNICODE_REPLACEMENT_CHARACTER_RUNE, UNICODE_REPLACEMENT_CHARACTER_RUNE, |
- UNICODE_REPLACEMENT_CHARACTER_RUNE, UNICODE_REPLACEMENT_CHARACTER_RUNE], |
- utf8ToRunes([0xf8, 0x88, 0x80, 0x80]), |
+ Expect.listEquals([ |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE |
+ ], utf8ToRunes([0xf8, 0x88, 0x80, 0x80]), |
"5-byte sequence with last byte missing"); |
- Expect.listEquals( |
- [UNICODE_REPLACEMENT_CHARACTER_RUNE, UNICODE_REPLACEMENT_CHARACTER_RUNE, |
- UNICODE_REPLACEMENT_CHARACTER_RUNE, UNICODE_REPLACEMENT_CHARACTER_RUNE, |
- UNICODE_REPLACEMENT_CHARACTER_RUNE], |
- utf8ToRunes([0xfc, 0x80, 0x80, 0x80, 0x80]), |
+ Expect.listEquals([ |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE |
+ ], utf8ToRunes([0xfc, 0x80, 0x80, 0x80, 0x80]), |
"6-byte sequence with last byte missing"); |
- Expect.listEquals([UNICODE_REPLACEMENT_CHARACTER_RUNE], |
- utf8ToRunes([0xdf]), |
+ Expect.listEquals([UNICODE_REPLACEMENT_CHARACTER_RUNE], utf8ToRunes([0xdf]), |
"2-byte sequence with last byte missing (hi)"); |
Expect.listEquals([UNICODE_REPLACEMENT_CHARACTER_RUNE], |
- utf8ToRunes([0xef, 0xbf]), |
- "3-byte sequence with last byte missing (hi)"); |
- Expect.listEquals( |
- [UNICODE_REPLACEMENT_CHARACTER_RUNE, UNICODE_REPLACEMENT_CHARACTER_RUNE, |
- UNICODE_REPLACEMENT_CHARACTER_RUNE], |
- utf8ToRunes([0xf7, 0xbf, 0xbf]), |
+ utf8ToRunes([0xef, 0xbf]), "3-byte sequence with last byte missing (hi)"); |
+ Expect.listEquals([ |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE |
+ ], utf8ToRunes([0xf7, 0xbf, 0xbf]), |
"4-byte sequence with last byte missing (hi)"); |
- Expect.listEquals( |
- [UNICODE_REPLACEMENT_CHARACTER_RUNE, UNICODE_REPLACEMENT_CHARACTER_RUNE, |
- UNICODE_REPLACEMENT_CHARACTER_RUNE, UNICODE_REPLACEMENT_CHARACTER_RUNE], |
- utf8ToRunes([0xfb, 0xbf, 0xbf, 0xbf]), |
+ Expect.listEquals([ |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE |
+ ], utf8ToRunes([0xfb, 0xbf, 0xbf, 0xbf]), |
"5-byte sequence with last byte missing (hi)"); |
- Expect.listEquals( |
- [UNICODE_REPLACEMENT_CHARACTER_RUNE, UNICODE_REPLACEMENT_CHARACTER_RUNE, |
- UNICODE_REPLACEMENT_CHARACTER_RUNE, UNICODE_REPLACEMENT_CHARACTER_RUNE, |
- UNICODE_REPLACEMENT_CHARACTER_RUNE], |
- utf8ToRunes([0xfd, 0xbf, 0xbf, 0xbf, 0xbf]), |
+ Expect.listEquals([ |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE |
+ ], utf8ToRunes([0xfd, 0xbf, 0xbf, 0xbf, 0xbf]), |
"6-byte sequence with last byte missing (hi)"); |
// Concatenation of incomplete sequences |
Expect.listEquals( |
- [UNICODE_REPLACEMENT_CHARACTER_RUNE, UNICODE_REPLACEMENT_CHARACTER_RUNE, |
- UNICODE_REPLACEMENT_CHARACTER_RUNE, UNICODE_REPLACEMENT_CHARACTER_RUNE, |
- UNICODE_REPLACEMENT_CHARACTER_RUNE, UNICODE_REPLACEMENT_CHARACTER_RUNE, |
- UNICODE_REPLACEMENT_CHARACTER_RUNE, UNICODE_REPLACEMENT_CHARACTER_RUNE, |
- UNICODE_REPLACEMENT_CHARACTER_RUNE, UNICODE_REPLACEMENT_CHARACTER_RUNE, |
- UNICODE_REPLACEMENT_CHARACTER_RUNE, UNICODE_REPLACEMENT_CHARACTER_RUNE, |
- UNICODE_REPLACEMENT_CHARACTER_RUNE, UNICODE_REPLACEMENT_CHARACTER_RUNE, |
- UNICODE_REPLACEMENT_CHARACTER_RUNE, UNICODE_REPLACEMENT_CHARACTER_RUNE, |
- UNICODE_REPLACEMENT_CHARACTER_RUNE, UNICODE_REPLACEMENT_CHARACTER_RUNE, |
- UNICODE_REPLACEMENT_CHARACTER_RUNE, UNICODE_REPLACEMENT_CHARACTER_RUNE, |
- UNICODE_REPLACEMENT_CHARACTER_RUNE, UNICODE_REPLACEMENT_CHARACTER_RUNE, |
- UNICODE_REPLACEMENT_CHARACTER_RUNE, UNICODE_REPLACEMENT_CHARACTER_RUNE, |
- UNICODE_REPLACEMENT_CHARACTER_RUNE, UNICODE_REPLACEMENT_CHARACTER_RUNE], |
- utf8ToRunes( |
- [ 0xc2, |
- 0xe0, 0x80, |
- 0xf0, 0x80, 0x80, |
- 0xf8, 0x88, 0x80, 0x80, |
- 0xfc, 0x80, 0x80, 0x80, 0x80, |
- 0xdf, |
- 0xef, 0xbf, |
- 0xf7, 0xbf, 0xbf, |
- 0xfb, 0xbf, 0xbf, 0xbf, |
- 0xfd, 0xbf, 0xbf, 0xbf, 0xbf ]), |
- "Concatenation of incomplete sequences"); |
+ [ |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE |
+ ], |
+ utf8ToRunes([ |
+ 0xc2, |
+ 0xe0, |
+ 0x80, |
+ 0xf0, |
+ 0x80, |
+ 0x80, |
+ 0xf8, |
+ 0x88, |
+ 0x80, |
+ 0x80, |
+ 0xfc, |
+ 0x80, |
+ 0x80, |
+ 0x80, |
+ 0x80, |
+ 0xdf, |
+ 0xef, |
+ 0xbf, |
+ 0xf7, |
+ 0xbf, |
+ 0xbf, |
+ 0xfb, |
+ 0xbf, |
+ 0xbf, |
+ 0xbf, |
+ 0xfd, |
+ 0xbf, |
+ 0xbf, |
+ 0xbf, |
+ 0xbf |
+ ]), |
+ "Concatenation of incomplete sequences"); |
// Impossible bytes |
- Expect.listEquals([UNICODE_REPLACEMENT_CHARACTER_RUNE], |
- utf8ToRunes([0xfe]), "fe"); |
- Expect.listEquals([UNICODE_REPLACEMENT_CHARACTER_RUNE], |
- utf8ToRunes([0xff]), "ff"); |
+ Expect.listEquals( |
+ [UNICODE_REPLACEMENT_CHARACTER_RUNE], utf8ToRunes([0xfe]), "fe"); |
+ Expect.listEquals( |
+ [UNICODE_REPLACEMENT_CHARACTER_RUNE], utf8ToRunes([0xff]), "ff"); |
Expect.listEquals([ |
- UNICODE_REPLACEMENT_CHARACTER_RUNE, |
- UNICODE_REPLACEMENT_CHARACTER_RUNE, |
- UNICODE_REPLACEMENT_CHARACTER_RUNE, |
- UNICODE_REPLACEMENT_CHARACTER_RUNE], |
- utf8ToRunes([0xfe, 0xfe, 0xff, 0xff]), "fe fe ff ff"); |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE |
+ ], utf8ToRunes([0xfe, 0xfe, 0xff, 0xff]), "fe fe ff ff"); |
// Overlong sequences |
- Expect.listEquals([UNICODE_REPLACEMENT_CHARACTER_RUNE], |
- utf8ToRunes([0xc0, 0xaf]), "c0 af"); |
+ Expect.listEquals( |
+ [UNICODE_REPLACEMENT_CHARACTER_RUNE], utf8ToRunes([0xc0, 0xaf]), "c0 af"); |
Expect.listEquals([UNICODE_REPLACEMENT_CHARACTER_RUNE], |
utf8ToRunes([0xe0, 0x80, 0xaf]), "e0 80 af"); |
Expect.listEquals([UNICODE_REPLACEMENT_CHARACTER_RUNE], |
utf8ToRunes([0xf0, 0x80, 0x80, 0xaf]), "f0 80 80 af"); |
- Expect.listEquals( |
- [UNICODE_REPLACEMENT_CHARACTER_RUNE, UNICODE_REPLACEMENT_CHARACTER_RUNE, |
- UNICODE_REPLACEMENT_CHARACTER_RUNE, UNICODE_REPLACEMENT_CHARACTER_RUNE, |
- UNICODE_REPLACEMENT_CHARACTER_RUNE], |
- utf8ToRunes([0xf8, 0x80, 0x80, 0x80, 0xaf]), "f8 80 80 80 af"); |
- Expect.listEquals( |
- [UNICODE_REPLACEMENT_CHARACTER_RUNE, UNICODE_REPLACEMENT_CHARACTER_RUNE, |
- UNICODE_REPLACEMENT_CHARACTER_RUNE, UNICODE_REPLACEMENT_CHARACTER_RUNE, |
- UNICODE_REPLACEMENT_CHARACTER_RUNE, UNICODE_REPLACEMENT_CHARACTER_RUNE], |
- utf8ToRunes([0xfc, 0x80, 0x80, 0x80, 0x80, 0xaf]), |
- "fc 80 80 80 80 af"); |
+ Expect.listEquals([ |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE |
+ ], utf8ToRunes([0xf8, 0x80, 0x80, 0x80, 0xaf]), "f8 80 80 80 af"); |
+ Expect.listEquals([ |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE |
+ ], utf8ToRunes([0xfc, 0x80, 0x80, 0x80, 0x80, 0xaf]), "fc 80 80 80 80 af"); |
- Expect.listEquals([UNICODE_REPLACEMENT_CHARACTER_RUNE], |
- utf8ToRunes([0xc1, 0xbf]), "c1 bf"); |
+ Expect.listEquals( |
+ [UNICODE_REPLACEMENT_CHARACTER_RUNE], utf8ToRunes([0xc1, 0xbf]), "c1 bf"); |
Expect.listEquals([UNICODE_REPLACEMENT_CHARACTER_RUNE], |
utf8ToRunes([0xe0, 0x9f, 0xbf]), "e0 9f bf"); |
Expect.listEquals([UNICODE_REPLACEMENT_CHARACTER_RUNE], |
utf8ToRunes([0xf0, 0x8f, 0xbf, 0xbf]), "f0 8f bf bf"); |
- Expect.listEquals( |
- [UNICODE_REPLACEMENT_CHARACTER_RUNE, UNICODE_REPLACEMENT_CHARACTER_RUNE, |
- UNICODE_REPLACEMENT_CHARACTER_RUNE, UNICODE_REPLACEMENT_CHARACTER_RUNE, |
- UNICODE_REPLACEMENT_CHARACTER_RUNE], |
- utf8ToRunes([0xf8, 0x87, 0xbf, 0xbf, 0xbf]), "f8 87 bf bf bf"); |
- Expect.listEquals( |
- [UNICODE_REPLACEMENT_CHARACTER_RUNE, UNICODE_REPLACEMENT_CHARACTER_RUNE, |
- UNICODE_REPLACEMENT_CHARACTER_RUNE, UNICODE_REPLACEMENT_CHARACTER_RUNE, |
- UNICODE_REPLACEMENT_CHARACTER_RUNE, UNICODE_REPLACEMENT_CHARACTER_RUNE], |
- utf8ToRunes([0xfc, 0x83, 0xbf, 0xbf, 0xbf, 0xbf]), |
- "fc 83 bf bf bf bf"); |
+ Expect.listEquals([ |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE |
+ ], utf8ToRunes([0xf8, 0x87, 0xbf, 0xbf, 0xbf]), "f8 87 bf bf bf"); |
+ Expect.listEquals([ |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE |
+ ], utf8ToRunes([0xfc, 0x83, 0xbf, 0xbf, 0xbf, 0xbf]), "fc 83 bf bf bf bf"); |
- Expect.listEquals([UNICODE_REPLACEMENT_CHARACTER_RUNE], |
- utf8ToRunes([0xc0, 0x80]), "c0 80"); |
+ Expect.listEquals( |
+ [UNICODE_REPLACEMENT_CHARACTER_RUNE], utf8ToRunes([0xc0, 0x80]), "c0 80"); |
Expect.listEquals([UNICODE_REPLACEMENT_CHARACTER_RUNE], |
utf8ToRunes([0xe0, 0x80, 0x80]), "e0 80 80"); |
Expect.listEquals([UNICODE_REPLACEMENT_CHARACTER_RUNE], |
utf8ToRunes([0xf0, 0x80, 0x80, 0x80]), "f0 80 80 80"); |
- Expect.listEquals( |
- [UNICODE_REPLACEMENT_CHARACTER_RUNE, UNICODE_REPLACEMENT_CHARACTER_RUNE, |
- UNICODE_REPLACEMENT_CHARACTER_RUNE, UNICODE_REPLACEMENT_CHARACTER_RUNE, |
- UNICODE_REPLACEMENT_CHARACTER_RUNE], |
- utf8ToRunes([0xf8, 0x80, 0x80, 0x80, 0x80]), "f8 80 80 80 80"); |
- Expect.listEquals( |
- [UNICODE_REPLACEMENT_CHARACTER_RUNE, UNICODE_REPLACEMENT_CHARACTER_RUNE, |
- UNICODE_REPLACEMENT_CHARACTER_RUNE, UNICODE_REPLACEMENT_CHARACTER_RUNE, |
- UNICODE_REPLACEMENT_CHARACTER_RUNE, UNICODE_REPLACEMENT_CHARACTER_RUNE], |
- utf8ToRunes([0xfc, 0x80, 0x80, 0x80, 0x80, 0x80]), |
- "fc 80 80 80 80 80"); |
+ Expect.listEquals([ |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE |
+ ], utf8ToRunes([0xf8, 0x80, 0x80, 0x80, 0x80]), "f8 80 80 80 80"); |
+ Expect.listEquals([ |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE, |
+ UNICODE_REPLACEMENT_CHARACTER_RUNE |
+ ], utf8ToRunes([0xfc, 0x80, 0x80, 0x80, 0x80, 0x80]), "fc 80 80 80 80 80"); |
// Other illegal code positions (???) |
- Expect.listEquals([0xfffe], utf8ToRunes([0xef, 0xbf, 0xbe]), |
- "U+FFFE"); |
- Expect.listEquals([0xffff], utf8ToRunes([0xef, 0xbf, 0xbf]), |
- "U+FFFF"); |
+ Expect.listEquals([0xfffe], utf8ToRunes([0xef, 0xbf, 0xbe]), "U+FFFE"); |
+ Expect.listEquals([0xffff], utf8ToRunes([0xef, 0xbf, 0xbf]), "U+FFFF"); |
} |
void testUtf8BytesToString() { |
- Expect.stringEquals(testEnglishPhrase, |
- decodeUtf8(testEnglishUtf8), "English"); |
+ Expect.stringEquals( |
+ testEnglishPhrase, decodeUtf8(testEnglishUtf8), "English"); |
- Expect.stringEquals(testDanishPhrase, |
- decodeUtf8(testDanishUtf8), "Danish"); |
+ Expect.stringEquals(testDanishPhrase, decodeUtf8(testDanishUtf8), "Danish"); |
- Expect.stringEquals(testHebrewPhrase, |
- decodeUtf8(testHebrewUtf8), "Hebrew"); |
+ Expect.stringEquals(testHebrewPhrase, decodeUtf8(testHebrewUtf8), "Hebrew"); |
- Expect.stringEquals(testRussianPhrase, |
- decodeUtf8(testRussianUtf8), "Russian"); |
+ Expect.stringEquals( |
+ testRussianPhrase, decodeUtf8(testRussianUtf8), "Russian"); |
- Expect.stringEquals(testGreekPhrase, |
- decodeUtf8(testGreekUtf8), "Greek"); |
+ Expect.stringEquals(testGreekPhrase, decodeUtf8(testGreekUtf8), "Greek"); |
- Expect.stringEquals(testKatakanaPhrase, |
- decodeUtf8(testKatakanaUtf8), "Katakana"); |
+ Expect.stringEquals( |
+ testKatakanaPhrase, decodeUtf8(testKatakanaUtf8), "Katakana"); |
} |