| Index: test/codegen/lib/convert/chunked_conversion_utf88_test.dart
|
| diff --git a/test/codegen/lib/convert/chunked_conversion_utf88_test.dart b/test/codegen/lib/convert/chunked_conversion_utf88_test.dart
|
| new file mode 100644
|
| index 0000000000000000000000000000000000000000..c9a968cbcf52790a4f5cc2956b784e346d5fdc91
|
| --- /dev/null
|
| +++ b/test/codegen/lib/convert/chunked_conversion_utf88_test.dart
|
| @@ -0,0 +1,249 @@
|
| +// Copyright (c) 2013, the Dart project authors. Please see the AUTHORS file
|
| +// for details. All rights reserved. Use of this source code is governed by a
|
| +// BSD-style license that can be found in the LICENSE file.
|
| +
|
| +library utf8_test;
|
| +import "package:expect/expect.dart";
|
| +import 'dart:convert';
|
| +
|
| +List<int> encode(String str) {
|
| + List<int> bytes;
|
| + ChunkedConversionSink byteSink =
|
| + new ByteConversionSink.withCallback((result) => bytes = result);
|
| + var stringConversionSink = new Utf8Encoder().startChunkedConversion(byteSink);
|
| + stringConversionSink.add(str);
|
| + stringConversionSink.close();
|
| + return bytes;
|
| +}
|
| +
|
| +List<int> encode2(String str) {
|
| + List<int> bytes;
|
| + ChunkedConversionSink byteSink =
|
| + new ByteConversionSink.withCallback((result) => bytes = result);
|
| + var stringConversionSink = new Utf8Encoder().startChunkedConversion(byteSink);
|
| + ClosableStringSink stringSink = stringConversionSink.asStringSink();
|
| + stringSink.write(str);
|
| + stringSink.close();
|
| + return bytes;
|
| +}
|
| +
|
| +List<int> encode3(String str) {
|
| + List<int> bytes;
|
| + ChunkedConversionSink byteSink =
|
| + new ByteConversionSink.withCallback((result) => bytes = result);
|
| + var stringConversionSink = new Utf8Encoder().startChunkedConversion(byteSink);
|
| + ClosableStringSink stringSink = stringConversionSink.asStringSink();
|
| + str.codeUnits.forEach(stringSink.writeCharCode);
|
| + stringSink.close();
|
| + return bytes;
|
| +}
|
| +
|
| +List<int> encode4(String str) {
|
| + List<int> bytes;
|
| + ChunkedConversionSink byteSink =
|
| + new ByteConversionSink.withCallback((result) => bytes = result);
|
| + var stringConversionSink = new Utf8Encoder().startChunkedConversion(byteSink);
|
| + ClosableStringSink stringSink = stringConversionSink.asStringSink();
|
| + str.runes.forEach(stringSink.writeCharCode);
|
| + stringSink.close();
|
| + return bytes;
|
| +}
|
| +
|
| +List<int> encode5(String str) {
|
| + List<int> bytes;
|
| + ChunkedConversionSink byteSink =
|
| + new ByteConversionSink.withCallback((result) => bytes = result);
|
| + var stringConversionSink = new Utf8Encoder().startChunkedConversion(byteSink);
|
| + ByteConversionSink inputByteSink = stringConversionSink.asUtf8Sink(false);
|
| + List<int> tmpBytes = UTF8.encode(str);
|
| + inputByteSink.add(tmpBytes);
|
| + inputByteSink.close();
|
| + return bytes;
|
| +}
|
| +
|
| +List<int> encode6(String str) {
|
| + List<int> bytes;
|
| + ChunkedConversionSink byteSink =
|
| + new ByteConversionSink.withCallback((result) => bytes = result);
|
| + var stringConversionSink = new Utf8Encoder().startChunkedConversion(byteSink);
|
| + ByteConversionSink inputByteSink = stringConversionSink.asUtf8Sink(false);
|
| + List<int> tmpBytes = UTF8.encode(str);
|
| + tmpBytes.forEach((b) => inputByteSink.addSlice([0, b, 1], 1, 2, false));
|
| + inputByteSink.close();
|
| + return bytes;
|
| +}
|
| +
|
| +List<int> encode7(String str) {
|
| + List<int> bytes;
|
| + ChunkedConversionSink byteSink =
|
| + new ByteConversionSink.withCallback((result) => bytes = result);
|
| + var stringConversionSink = new Utf8Encoder().startChunkedConversion(byteSink);
|
| + stringConversionSink.addSlice("1" + str + "2", 1, str.length + 1, false);
|
| + stringConversionSink.close();
|
| + return bytes;
|
| +}
|
| +
|
| +
|
| +int _nextPowerOf2(v) {
|
| + assert(v > 0);
|
| + v--;
|
| + v |= v >> 1;
|
| + v |= v >> 2;
|
| + v |= v >> 4;
|
| + v |= v >> 8;
|
| + v |= v >> 16;
|
| + v++;
|
| + return v;
|
| +}
|
| +
|
| +runTest(test) {
|
| + List<int> bytes = test[0];
|
| + String string = test[1];
|
| + Expect.listEquals(bytes, encode(string));
|
| + Expect.listEquals(bytes, encode2(string));
|
| + Expect.listEquals(bytes, encode3(string));
|
| + Expect.listEquals(bytes, encode4(string));
|
| + Expect.listEquals(bytes, encode5(string));
|
| + Expect.listEquals(bytes, encode6(string));
|
| + Expect.listEquals(bytes, encode7(string));
|
| +}
|
| +
|
| +main() {
|
| + const LEADING_SURROGATE = 0xd801;
|
| + const TRAILING_SURROGATE = 0xdc12;
|
| + const UTF8_ENCODING = const [0xf0, 0x90, 0x90, 0x92];
|
| + const UTF8_LEADING = const [0xed, 0xa0, 0x81];
|
| + const UTF8_TRAILING = const [0xed, 0xb0, 0x92];
|
| + const CHAR_A = 0x61;
|
| +
|
| + // Test surrogates at all kinds of locations.
|
| + var tests = [];
|
| + List codeUnits = <int>[];
|
| + for (int i = 0; i < 2049; i++) {
|
| + // Invariant: codeUnits[0..i - 1] is filled with CHAR_A (character 'a').
|
| + codeUnits.length = i + 1;
|
| + codeUnits[i] = CHAR_A;
|
| +
|
| + // Only test for problem zones, close to powers of two.
|
| + if (i > 20 && _nextPowerOf2(i - 2) - i > 10) continue;
|
| +
|
| + codeUnits[i] = LEADING_SURROGATE;
|
| + var str = new String.fromCharCodes(codeUnits);
|
| + var bytes = new List.filled(i + 3, CHAR_A);
|
| + bytes[i] = UTF8_LEADING[0];
|
| + bytes[i + 1] = UTF8_LEADING[1];
|
| + bytes[i + 2] = UTF8_LEADING[2];
|
| + runTest([bytes, str]);
|
| +
|
| + codeUnits[i] = TRAILING_SURROGATE;
|
| + str = new String.fromCharCodes(codeUnits);
|
| + bytes = new List.filled(i + 3, CHAR_A);
|
| + bytes[i] = UTF8_TRAILING[0];
|
| + bytes[i + 1] = UTF8_TRAILING[1];
|
| + bytes[i + 2] = UTF8_TRAILING[2];
|
| + runTest([bytes, str]);
|
| +
|
| + codeUnits.length = i + 2;
|
| + codeUnits[i] = LEADING_SURROGATE;
|
| + codeUnits[i + 1] = TRAILING_SURROGATE;
|
| + str = new String.fromCharCodes(codeUnits);
|
| + bytes = new List.filled(i + 4, CHAR_A);
|
| + bytes[i] = UTF8_ENCODING[0];
|
| + bytes[i + 1] = UTF8_ENCODING[1];
|
| + bytes[i + 2] = UTF8_ENCODING[2];
|
| + bytes[i + 3] = UTF8_ENCODING[3];
|
| + runTest([bytes, str]);
|
| +
|
| + codeUnits[i] = TRAILING_SURROGATE;
|
| + codeUnits[i + 1] = TRAILING_SURROGATE;
|
| + str = new String.fromCharCodes(codeUnits);
|
| + bytes = new List.filled(i + 6, CHAR_A);
|
| + bytes[i] = UTF8_TRAILING[0];
|
| + bytes[i + 1] = UTF8_TRAILING[1];
|
| + bytes[i + 2] = UTF8_TRAILING[2];
|
| + bytes[i + 3] = UTF8_TRAILING[0];
|
| + bytes[i + 4] = UTF8_TRAILING[1];
|
| + bytes[i + 5] = UTF8_TRAILING[2];
|
| + runTest([bytes, str]);
|
| +
|
| + codeUnits[i] = LEADING_SURROGATE;
|
| + codeUnits[i + 1] = LEADING_SURROGATE;
|
| + str = new String.fromCharCodes(codeUnits);
|
| + bytes = new List.filled(i + 6, CHAR_A);
|
| + bytes[i] = UTF8_LEADING[0];
|
| + bytes[i + 1] = UTF8_LEADING[1];
|
| + bytes[i + 2] = UTF8_LEADING[2];
|
| + bytes[i + 3] = UTF8_LEADING[0];
|
| + bytes[i + 4] = UTF8_LEADING[1];
|
| + bytes[i + 5] = UTF8_LEADING[2];
|
| + runTest([bytes, str]);
|
| +
|
| + codeUnits[i] = TRAILING_SURROGATE;
|
| + codeUnits[i + 1] = LEADING_SURROGATE;
|
| + str = new String.fromCharCodes(codeUnits);
|
| + bytes = new List.filled(i + 6, CHAR_A);
|
| + bytes[i] = UTF8_TRAILING[0];
|
| + bytes[i + 1] = UTF8_TRAILING[1];
|
| + bytes[i + 2] = UTF8_TRAILING[2];
|
| + bytes[i + 3] = UTF8_LEADING[0];
|
| + bytes[i + 4] = UTF8_LEADING[1];
|
| + bytes[i + 5] = UTF8_LEADING[2];
|
| + runTest([bytes, str]);
|
| +
|
| + codeUnits.length = i + 3;
|
| + codeUnits[i] = LEADING_SURROGATE;
|
| + codeUnits[i + 1] = TRAILING_SURROGATE;
|
| + codeUnits[i + 2] = CHAR_A; // Add trailing 'a'.
|
| + str = new String.fromCharCodes(codeUnits);
|
| + bytes = new List.filled(i + 5, CHAR_A);
|
| + bytes[i] = UTF8_ENCODING[0];
|
| + bytes[i + 1] = UTF8_ENCODING[1];
|
| + bytes[i + 2] = UTF8_ENCODING[2];
|
| + bytes[i + 3] = UTF8_ENCODING[3];
|
| + // No need to assign the 'a' character. The whole list is already filled
|
| + // with it.
|
| + runTest([bytes, str]);
|
| +
|
| + codeUnits[i] = TRAILING_SURROGATE;
|
| + codeUnits[i + 1] = TRAILING_SURROGATE;
|
| + codeUnits[i + 2] = CHAR_A; // Add trailing 'a'.
|
| + str = new String.fromCharCodes(codeUnits);
|
| + bytes = new List.filled(i + 7, CHAR_A);
|
| + bytes[i] = UTF8_TRAILING[0];
|
| + bytes[i + 1] = UTF8_TRAILING[1];
|
| + bytes[i + 2] = UTF8_TRAILING[2];
|
| + bytes[i + 3] = UTF8_TRAILING[0];
|
| + bytes[i + 4] = UTF8_TRAILING[1];
|
| + bytes[i + 5] = UTF8_TRAILING[2];
|
| + runTest([bytes, str]);
|
| +
|
| + codeUnits[i] = LEADING_SURROGATE;
|
| + codeUnits[i + 1] = LEADING_SURROGATE;
|
| + codeUnits[i + 2] = CHAR_A; // Add trailing 'a'.
|
| + str = new String.fromCharCodes(codeUnits);
|
| + bytes = new List.filled(i + 7, CHAR_A);
|
| + bytes[i] = UTF8_LEADING[0];
|
| + bytes[i + 1] = UTF8_LEADING[1];
|
| + bytes[i + 2] = UTF8_LEADING[2];
|
| + bytes[i + 3] = UTF8_LEADING[0];
|
| + bytes[i + 4] = UTF8_LEADING[1];
|
| + bytes[i + 5] = UTF8_LEADING[2];
|
| + runTest([bytes, str]);
|
| +
|
| + codeUnits[i] = TRAILING_SURROGATE;
|
| + codeUnits[i + 1] = LEADING_SURROGATE;
|
| + codeUnits[i + 2] = CHAR_A; // Add trailing 'a'.
|
| + str = new String.fromCharCodes(codeUnits);
|
| + bytes = new List.filled(i + 7, CHAR_A);
|
| + bytes[i] = UTF8_TRAILING[0];
|
| + bytes[i + 1] = UTF8_TRAILING[1];
|
| + bytes[i + 2] = UTF8_TRAILING[2];
|
| + bytes[i + 3] = UTF8_LEADING[0];
|
| + bytes[i + 4] = UTF8_LEADING[1];
|
| + bytes[i + 5] = UTF8_LEADING[2];
|
| + runTest([bytes, str]);
|
| +
|
| + // Make sure the invariant is correct.
|
| + codeUnits[i] = CHAR_A;
|
| + }
|
| +}
|
|
|