Index: source/test/cintltst/custrtrn.c |
diff --git a/source/test/cintltst/custrtrn.c b/source/test/cintltst/custrtrn.c |
deleted file mode 100644 |
index cc6d060f1964dfab6e3756ddf63befc966841401..0000000000000000000000000000000000000000 |
--- a/source/test/cintltst/custrtrn.c |
+++ /dev/null |
@@ -1,2121 +0,0 @@ |
-/******************************************************************** |
- * COPYRIGHT: |
- * Copyright (c) 2001-2014, International Business Machines Corporation and |
- * others. All Rights Reserved. |
- ********************************************************************/ |
-/******************************************************************************** |
-* |
-* File custrtrn.C |
-* |
-* Modification History: |
-* Name Description |
-* Ram String transformations test |
-********************************************************************************* |
-*/ |
-/****************************************************************************/ |
- |
- |
-#include <stdlib.h> |
-#include <stdio.h> |
-#include <string.h> |
-#include "unicode/utypes.h" |
-#include "unicode/ustring.h" |
-#include "unicode/ures.h" |
-#include "ustr_imp.h" |
-#include "cintltst.h" |
-#include "cmemory.h" |
-#include "cstring.h" |
-#include "cwchar.h" |
- |
-void addUCharTransformTest(TestNode** root); |
- |
-static void Test_strToUTF32(void); |
-static void Test_strToUTF32_surrogates(void); |
-static void Test_strFromUTF32(void); |
-static void Test_strFromUTF32_surrogates(void); |
-static void Test_UChar_UTF8_API(void); |
-static void Test_FromUTF8(void); |
-static void Test_FromUTF8Lenient(void); |
-static void Test_UChar_WCHART_API(void); |
-static void Test_widestrs(void); |
-static void Test_WCHART_LongString(void); |
-static void Test_strToJavaModifiedUTF8(void); |
-static void Test_strFromJavaModifiedUTF8(void); |
-static void TestNullEmptySource(void); |
- |
-void |
-addUCharTransformTest(TestNode** root) |
-{ |
- addTest(root, &Test_strToUTF32, "custrtrn/Test_strToUTF32"); |
- addTest(root, &Test_strToUTF32_surrogates, "custrtrn/Test_strToUTF32_surrogates"); |
- addTest(root, &Test_strFromUTF32, "custrtrn/Test_strFromUTF32"); |
- addTest(root, &Test_strFromUTF32_surrogates, "custrtrn/Test_strFromUTF32_surrogates"); |
- addTest(root, &Test_UChar_UTF8_API, "custrtrn/Test_UChar_UTF8_API"); |
- addTest(root, &Test_FromUTF8, "custrtrn/Test_FromUTF8"); |
- addTest(root, &Test_FromUTF8Lenient, "custrtrn/Test_FromUTF8Lenient"); |
- addTest(root, &Test_UChar_WCHART_API, "custrtrn/Test_UChar_WCHART_API"); |
- addTest(root, &Test_widestrs, "custrtrn/Test_widestrs"); |
-#if !UCONFIG_NO_FILE_IO && !UCONFIG_NO_LEGACY_CONVERSION |
- addTest(root, &Test_WCHART_LongString, "custrtrn/Test_WCHART_LongString"); |
-#endif |
- addTest(root, &Test_strToJavaModifiedUTF8, "custrtrn/Test_strToJavaModifiedUTF8"); |
- addTest(root, &Test_strFromJavaModifiedUTF8, "custrtrn/Test_strFromJavaModifiedUTF8"); |
- addTest(root, &TestNullEmptySource, "custrtrn/TestNullEmptySource"); |
-} |
- |
-static const UChar32 src32[]={ |
- 0x00A8, 0x3003, 0x3005, 0x2015, 0xFF5E, 0x2016, 0x2026, 0x2018, 0x000D, 0x000A, |
- 0x2019, 0x201C, 0x201D, 0x3014, 0x3015, 0x3008, 0x3009, 0x300A, 0x000D, 0x000A, |
- 0x300B, 0x300C, 0x300D, 0x300E, 0x300F, 0x3016, 0x3017, 0x3010, 0x000D, 0x000A, |
- 0x3011, 0x00B1, 0x00D7, 0x00F7, 0x2236, 0x2227, 0x7FC1, 0x8956, 0x000D, 0x000A, |
- 0x9D2C, 0x9D0E, 0x9EC4, 0x5CA1, 0x6C96, 0x837B, 0x5104, 0x5C4B, 0x000D, 0x000A, |
- 0x61B6, 0x81C6, 0x6876, 0x7261, 0x4E59, 0x4FFA, 0x5378, 0x57F7, 0x000D, 0x000A, |
- 0x57F4, 0x57F9, 0x57FA, 0x57FC, 0x5800, 0x5802, 0x5805, 0x5806, 0x000D, 0x000A, |
- 0x580A, 0x581E, 0x6BB5, 0x6BB7, 0x6BBA, 0x6BBC, 0x9CE2, 0x977C, 0x000D, 0x000A, |
- 0x6BBF, 0x6BC1, 0x6BC5, 0x6BC6, 0x6BCB, 0x6BCD, 0x6BCF, 0x6BD2, 0x000D, 0x000A, |
- 0x6BD3, 0x6BD4, 0x6BD6, 0x6BD7, 0x6BD8, 0x6BDB, 0x6BEB, 0x6BEC, 0x000D, 0x000A, |
- 0x6C05, 0x6C08, 0x6C0F, 0x6C11, 0x6C13, 0x6C23, 0x6C34, 0x0041, 0x000D, 0x000A, |
- 0x0043, 0x0044, 0x0045, 0x0046, 0x0047, 0x0048, 0x0049, 0x004A, 0x000D, 0x000A, |
- 0x004B, 0x004C, 0x004D, 0x004E, 0x004F, 0x0050, 0x0051, 0x0052, 0x000D, 0x000A, |
- 0x0053, 0x0054, 0x0055, 0x0056, 0x0057, 0x0058, 0x0059, 0x005A, 0x000D, 0x000A, |
- 0x005B, 0x9792, 0x9CCC, 0x9CCD, 0x9CCE, 0x9CCF, 0x9CD0, 0x9CD3, 0x000D, 0x000A, |
- 0x9CD4, 0x9CD5, 0x9CD7, 0x9CD8, 0x9CD9, 0x9CDC, 0x9CDD, 0x9CDF, 0x000D, 0x000A, |
- 0x9785, 0x9791, 0x00BD, 0x0390, 0x0385, 0x0386, 0x0388, 0x0389, 0x000D, 0x000A, |
- 0x038E, 0x038F, 0x0390, 0x0391, 0x0392, 0x0393, 0x0394, 0x0395, 0x000D, 0x000A, |
- 0x0396, 0x0397, 0x0398, 0x0399, 0x039A, 0x038A, 0x038C, 0x039C, 0x000D, 0x000A, |
- /* test non-BMP code points */ |
- 0x0002A699, |
- 0x0002A69C, 0x0002A69D, 0x0002A69E, 0x0002A69F, 0x0002A6A0, 0x0002A6A5, 0x0002A6A6, 0x0002A6A7, 0x0002A6A8, 0x0002A6AB, |
- 0x0002A6AC, 0x0002A6AD, 0x0002A6AE, 0x0002A6AF, 0x0002A6B0, 0x0002A6B1, 0x0002A6B3, 0x0002A6B5, 0x0002A6B6, 0x0002A6B7, |
- 0x0002A6B8, 0x0002A6B9, 0x0002A6BA, 0x0002A6BB, 0x0002A6BC, 0x0002A6BD, 0x0002A6BE, 0x0002A6BF, 0x0002A6C0, 0x0002A6C1, |
- 0x0002A6C2, 0x0002A6C3, 0x0002A6C4, 0x0002A6C8, 0x0002A6CA, 0x0002A6CB, 0x0002A6CD, 0x0002A6CE, 0x0002A6CF, 0x0002A6D0, |
- 0x0002A6D1, 0x0002A6D2, 0x0002A6D3, 0x0002A6D4, 0x0002A6D5, |
- |
- 0x4DB3, 0x4DB4, 0x4DB5, 0x4E00, 0x4E00, 0x4E01, 0x4E02, 0x4E03, 0x000D, 0x000A, |
- 0x0392, 0x0393, 0x0394, 0x0395, 0x0396, 0x0397, 0x33E0, 0x33E6, 0x000D, 0x000A, |
- 0x4E05, 0x4E07, 0x4E04, 0x4E08, 0x4E08, 0x4E09, 0x4E0A, 0x4E0B, 0x000D, 0x000A, |
- 0x4E0C, 0x0021, 0x0022, 0x0023, 0x0024, 0xFF40, 0xFF41, 0xFF42, 0x000D, 0x000A, |
- 0xFF43, 0xFF44, 0xFF45, 0xFF46, 0xFF47, 0xFF48, 0xFF49, 0xFF4A, 0x000D, 0x000A,0x0000 |
-}; |
- |
-static const UChar src16[] = { |
- 0x00A8, 0x3003, 0x3005, 0x2015, 0xFF5E, 0x2016, 0x2026, 0x2018, 0x000D, 0x000A, |
- 0x2019, 0x201C, 0x201D, 0x3014, 0x3015, 0x3008, 0x3009, 0x300A, 0x000D, 0x000A, |
- 0x300B, 0x300C, 0x300D, 0x300E, 0x300F, 0x3016, 0x3017, 0x3010, 0x000D, 0x000A, |
- 0x3011, 0x00B1, 0x00D7, 0x00F7, 0x2236, 0x2227, 0x7FC1, 0x8956, 0x000D, 0x000A, |
- 0x9D2C, 0x9D0E, 0x9EC4, 0x5CA1, 0x6C96, 0x837B, 0x5104, 0x5C4B, 0x000D, 0x000A, |
- 0x61B6, 0x81C6, 0x6876, 0x7261, 0x4E59, 0x4FFA, 0x5378, 0x57F7, 0x000D, 0x000A, |
- 0x57F4, 0x57F9, 0x57FA, 0x57FC, 0x5800, 0x5802, 0x5805, 0x5806, 0x000D, 0x000A, |
- 0x580A, 0x581E, 0x6BB5, 0x6BB7, 0x6BBA, 0x6BBC, 0x9CE2, 0x977C, 0x000D, 0x000A, |
- 0x6BBF, 0x6BC1, 0x6BC5, 0x6BC6, 0x6BCB, 0x6BCD, 0x6BCF, 0x6BD2, 0x000D, 0x000A, |
- 0x6BD3, 0x6BD4, 0x6BD6, 0x6BD7, 0x6BD8, 0x6BDB, 0x6BEB, 0x6BEC, 0x000D, 0x000A, |
- 0x6C05, 0x6C08, 0x6C0F, 0x6C11, 0x6C13, 0x6C23, 0x6C34, 0x0041, 0x000D, 0x000A, |
- 0x0043, 0x0044, 0x0045, 0x0046, 0x0047, 0x0048, 0x0049, 0x004A, 0x000D, 0x000A, |
- 0x004B, 0x004C, 0x004D, 0x004E, 0x004F, 0x0050, 0x0051, 0x0052, 0x000D, 0x000A, |
- 0x0053, 0x0054, 0x0055, 0x0056, 0x0057, 0x0058, 0x0059, 0x005A, 0x000D, 0x000A, |
- 0x005B, 0x9792, 0x9CCC, 0x9CCD, 0x9CCE, 0x9CCF, 0x9CD0, 0x9CD3, 0x000D, 0x000A, |
- 0x9CD4, 0x9CD5, 0x9CD7, 0x9CD8, 0x9CD9, 0x9CDC, 0x9CDD, 0x9CDF, 0x000D, 0x000A, |
- 0x9785, 0x9791, 0x00BD, 0x0390, 0x0385, 0x0386, 0x0388, 0x0389, 0x000D, 0x000A, |
- 0x038E, 0x038F, 0x0390, 0x0391, 0x0392, 0x0393, 0x0394, 0x0395, 0x000D, 0x000A, |
- 0x0396, 0x0397, 0x0398, 0x0399, 0x039A, 0x038A, 0x038C, 0x039C, 0x000D, 0x000A, |
- |
- /* test non-BMP code points */ |
- 0xD869, 0xDE99, 0xD869, 0xDE9C, 0xD869, 0xDE9D, 0xD869, 0xDE9E, 0xD869, 0xDE9F, |
- 0xD869, 0xDEA0, 0xD869, 0xDEA5, 0xD869, 0xDEA6, 0xD869, 0xDEA7, 0xD869, 0xDEA8, |
- 0xD869, 0xDEAB, 0xD869, 0xDEAC, 0xD869, 0xDEAD, 0xD869, 0xDEAE, 0xD869, 0xDEAF, |
- 0xD869, 0xDEB0, 0xD869, 0xDEB1, 0xD869, 0xDEB3, 0xD869, 0xDEB5, 0xD869, 0xDEB6, |
- 0xD869, 0xDEB7, 0xD869, 0xDEB8, 0xD869, 0xDEB9, 0xD869, 0xDEBA, 0xD869, 0xDEBB, |
- 0xD869, 0xDEBC, 0xD869, 0xDEBD, 0xD869, 0xDEBE, 0xD869, 0xDEBF, 0xD869, 0xDEC0, |
- 0xD869, 0xDEC1, 0xD869, 0xDEC2, 0xD869, 0xDEC3, 0xD869, 0xDEC4, 0xD869, 0xDEC8, |
- 0xD869, 0xDECA, 0xD869, 0xDECB, 0xD869, 0xDECD, 0xD869, 0xDECE, 0xD869, 0xDECF, |
- 0xD869, 0xDED0, 0xD869, 0xDED1, 0xD869, 0xDED2, 0xD869, 0xDED3, 0xD869, 0xDED4, |
- 0xD869, 0xDED5, |
- |
- 0x4DB3, 0x4DB4, 0x4DB5, 0x4E00, 0x4E00, 0x4E01, 0x4E02, 0x4E03, 0x000D, 0x000A, |
- 0x0392, 0x0393, 0x0394, 0x0395, 0x0396, 0x0397, 0x33E0, 0x33E6, 0x000D, 0x000A, |
- 0x4E05, 0x4E07, 0x4E04, 0x4E08, 0x4E08, 0x4E09, 0x4E0A, 0x4E0B, 0x000D, 0x000A, |
- 0x4E0C, 0x0021, 0x0022, 0x0023, 0x0024, 0xFF40, 0xFF41, 0xFF42, 0x000D, 0x000A, |
- 0xFF43, 0xFF44, 0xFF45, 0xFF46, 0xFF47, 0xFF48, 0xFF49, 0xFF4A, 0x000D, 0x000A,0x0000 |
-}; |
- |
- |
-static void Test_strToUTF32(void){ |
- UErrorCode err = U_ZERO_ERROR; |
- UChar32 u32Target[400]; |
- int32_t u32DestLen; |
- int i= 0; |
- |
- /* first with length */ |
- u32DestLen = -2; |
- u_strToUTF32(u32Target, 0, &u32DestLen, src16, UPRV_LENGTHOF(src16),&err); |
- if(err != U_BUFFER_OVERFLOW_ERROR || u32DestLen != UPRV_LENGTHOF(src32)) { |
- log_err("u_strToUTF32(preflight with length): " |
- "length %ld != %ld and %s != U_BUFFER_OVERFLOW_ERROR\n", |
- (long)u32DestLen, (long)UPRV_LENGTHOF(src32), u_errorName(err)); |
- return; |
- } |
- err = U_ZERO_ERROR; |
- u32DestLen = -2; |
- u_strToUTF32(u32Target, UPRV_LENGTHOF(src32)+1, &u32DestLen, src16, UPRV_LENGTHOF(src16),&err); |
- if(err != U_ZERO_ERROR || u32DestLen != UPRV_LENGTHOF(src32)) { |
- log_err("u_strToUTF32(with length): " |
- "length %ld != %ld and %s != U_ZERO_ERROR\n", |
- (long)u32DestLen, (long)UPRV_LENGTHOF(src32), u_errorName(err)); |
- return; |
- } |
- /*for(i=0; i< u32DestLen; i++){ |
- printf("0x%08X, ",uTarget[i]); |
- if(i%10==0){ |
- printf("\n"); |
- } |
- }*/ |
- for(i=0; i< UPRV_LENGTHOF(src32); i++){ |
- if(u32Target[i] != src32[i]){ |
- log_verbose("u_strToUTF32(with length) failed expected: %04X got: %04X at index: %i \n", src32[i], u32Target[i],i); |
- } |
- } |
- if(u32Target[i] != 0){ |
- log_verbose("u_strToUTF32(with length) failed expected: %04X got: %04X at index: %i \n", 0, u32Target[i],i); |
- } |
- |
- /* now NUL-terminated */ |
- u32DestLen = -2; |
- u_strToUTF32(NULL,0, &u32DestLen, src16, -1,&err); |
- if(err != U_BUFFER_OVERFLOW_ERROR || u32DestLen != UPRV_LENGTHOF(src32)-1) { |
- log_err("u_strToUTF32(preflight with NUL-termination): " |
- "length %ld != %ld and %s != U_BUFFER_OVERFLOW_ERROR\n", |
- (long)u32DestLen, (long)UPRV_LENGTHOF(src32)-1, u_errorName(err)); |
- return; |
- } |
- err = U_ZERO_ERROR; |
- u32DestLen = -2; |
- u_strToUTF32(u32Target, UPRV_LENGTHOF(src32), &u32DestLen, src16, -1,&err); |
- if(err != U_ZERO_ERROR || u32DestLen != UPRV_LENGTHOF(src32)-1) { |
- log_err("u_strToUTF32(with NUL-termination): " |
- "length %ld != %ld and %s != U_ZERO_ERROR\n", |
- (long)u32DestLen, (long)UPRV_LENGTHOF(src32)-1, u_errorName(err)); |
- return; |
- } |
- |
- for(i=0; i< UPRV_LENGTHOF(src32); i++){ |
- if(u32Target[i] != src32[i]){ |
- log_verbose("u_strToUTF32(NUL-termination) failed expected: %04X got: %04X \n", src32[i], u32Target[i]); |
- } |
- } |
-} |
- |
-/* test unpaired surrogates */ |
-static void Test_strToUTF32_surrogates() { |
- UErrorCode err = U_ZERO_ERROR; |
- UChar32 u32Target[400]; |
- int32_t len16, u32DestLen; |
- int32_t numSubstitutions; |
- int i; |
- |
- static const UChar surr16[] = { 0x41, 0xd900, 0x61, 0xdc00, 0x5a, 0xd900, 0xdc00, 0x7a, 0 }; |
- static const UChar32 expected[] = { 0x5a, 0x50000, 0x7a, 0 }; |
- static const UChar32 expected_FFFD[] = { 0x41, 0xfffd, 0x61, 0xfffd, 0x5a, 0x50000, 0x7a, 0 }; |
- static const UChar32 expected_12345[] = { 0x41, 0x12345, 0x61, 0x12345, 0x5a, 0x50000, 0x7a, 0 }; |
- len16 = UPRV_LENGTHOF(surr16); |
- for(i = 0; i < 4; ++i) { |
- err = U_ZERO_ERROR; |
- u_strToUTF32(u32Target, 0, &u32DestLen, surr16+i, len16-i, &err); |
- if(err != U_INVALID_CHAR_FOUND) { |
- log_err("u_strToUTF32(preflight surr16+%ld) sets %s != U_INVALID_CHAR_FOUND\n", |
- (long)i, u_errorName(err)); |
- return; |
- } |
- |
- err = U_ZERO_ERROR; |
- u_strToUTF32(u32Target, UPRV_LENGTHOF(u32Target), &u32DestLen, surr16+i, len16-i, &err); |
- if(err != U_INVALID_CHAR_FOUND) { |
- log_err("u_strToUTF32(surr16+%ld) sets %s != U_INVALID_CHAR_FOUND\n", |
- (long)i, u_errorName(err)); |
- return; |
- } |
- |
- err = U_ZERO_ERROR; |
- u_strToUTF32(NULL, 0, &u32DestLen, surr16+i, -1, &err); |
- if(err != U_INVALID_CHAR_FOUND) { |
- log_err("u_strToUTF32(preflight surr16+%ld/NUL) sets %s != U_INVALID_CHAR_FOUND\n", |
- (long)i, u_errorName(err)); |
- return; |
- } |
- |
- err = U_ZERO_ERROR; |
- u_strToUTF32(u32Target, UPRV_LENGTHOF(u32Target), &u32DestLen, surr16+i, -1, &err); |
- if(err != U_INVALID_CHAR_FOUND) { |
- log_err("u_strToUTF32(surr16+%ld/NUL) sets %s != U_INVALID_CHAR_FOUND\n", |
- (long)i, u_errorName(err)); |
- return; |
- } |
- } |
- |
- err = U_ZERO_ERROR; |
- u_strToUTF32(u32Target, 0, &u32DestLen, surr16+4, len16-4-1, &err); |
- if(err != U_BUFFER_OVERFLOW_ERROR || u32DestLen != 3) { |
- log_err("u_strToUTF32(preflight surr16+4) sets %s != U_BUFFER_OVERFLOW_ERROR or an unexpected length\n", |
- u_errorName(err)); |
- return; |
- } |
- |
- err = U_ZERO_ERROR; |
- u_strToUTF32(u32Target, UPRV_LENGTHOF(u32Target), &u32DestLen, surr16+4, len16-4-1, &err); |
- if(err != U_ZERO_ERROR || u32DestLen != 3 || uprv_memcmp(u32Target, expected, 4*4)) { |
- log_err("u_strToUTF32(surr16+4) sets %s != U_ZERO_ERROR or does not produce the expected string\n", |
- u_errorName(err)); |
- return; |
- } |
- |
- err = U_ZERO_ERROR; |
- u_strToUTF32(NULL, 0, &u32DestLen, surr16+4, -1, &err); |
- if(err != U_BUFFER_OVERFLOW_ERROR || u32DestLen != 3) { |
- log_err("u_strToUTF32(preflight surr16+4/NUL) sets %s != U_BUFFER_OVERFLOW_ERROR or an unexpected length\n", |
- u_errorName(err)); |
- return; |
- } |
- |
- err = U_ZERO_ERROR; |
- u_strToUTF32(u32Target, UPRV_LENGTHOF(u32Target), &u32DestLen, surr16+4, -1, &err); |
- if(err != U_ZERO_ERROR || u32DestLen != 3 || uprv_memcmp(u32Target, expected, 4*4)) { |
- log_err("u_strToUTF32(surr16+4/NUL) sets %s != U_ZERO_ERROR or does not produce the expected string\n", |
- u_errorName(err)); |
- return; |
- } |
- |
- /* with substitution character */ |
- numSubstitutions = -1; |
- err = U_ZERO_ERROR; |
- u_strToUTF32WithSub(u32Target, 0, &u32DestLen, surr16, len16-1, 0xfffd, &numSubstitutions, &err); |
- if(err != U_BUFFER_OVERFLOW_ERROR || u32DestLen != 7 || numSubstitutions != 2) { |
- log_err("u_strToUTF32WithSub(preflight surr16) sets %s != U_BUFFER_OVERFLOW_ERROR or an unexpected length\n", |
- u_errorName(err)); |
- return; |
- } |
- |
- err = U_ZERO_ERROR; |
- u_strToUTF32WithSub(u32Target, UPRV_LENGTHOF(u32Target), &u32DestLen, surr16, len16-1, 0xfffd, &numSubstitutions, &err); |
- if(err != U_ZERO_ERROR || u32DestLen != 7 || numSubstitutions != 2 || uprv_memcmp(u32Target, expected_FFFD, 8*4)) { |
- log_err("u_strToUTF32WithSub(surr16) sets %s != U_ZERO_ERROR or does not produce the expected string\n", |
- u_errorName(err)); |
- return; |
- } |
- |
- err = U_ZERO_ERROR; |
- u_strToUTF32WithSub(NULL, 0, &u32DestLen, surr16, -1, 0x12345, &numSubstitutions, &err); |
- if(err != U_BUFFER_OVERFLOW_ERROR || u32DestLen != 7 || numSubstitutions != 2) { |
- log_err("u_strToUTF32WithSub(preflight surr16/NUL) sets %s != U_BUFFER_OVERFLOW_ERROR or an unexpected length\n", |
- u_errorName(err)); |
- return; |
- } |
- |
- err = U_ZERO_ERROR; |
- u_strToUTF32WithSub(u32Target, UPRV_LENGTHOF(u32Target), &u32DestLen, surr16, -1, 0x12345, &numSubstitutions, &err); |
- if(err != U_ZERO_ERROR || u32DestLen != 7 || numSubstitutions != 2 || uprv_memcmp(u32Target, expected_12345, 8*4)) { |
- log_err("u_strToUTF32WithSub(surr16/NUL) sets %s != U_ZERO_ERROR or does not produce the expected string\n", |
- u_errorName(err)); |
- return; |
- } |
-} |
- |
-static void Test_strFromUTF32(void){ |
- UErrorCode err = U_ZERO_ERROR; |
- UChar uTarget[400]; |
- int32_t uDestLen; |
- int i= 0; |
- |
- /* first with length */ |
- uDestLen = -2; |
- u_strFromUTF32(uTarget,0,&uDestLen,src32,UPRV_LENGTHOF(src32),&err); |
- if(err != U_BUFFER_OVERFLOW_ERROR || uDestLen != UPRV_LENGTHOF(src16)) { |
- log_err("u_strFromUTF32(preflight with length): " |
- "length %ld != %ld and %s != U_BUFFER_OVERFLOW_ERROR\n", |
- (long)uDestLen, (long)UPRV_LENGTHOF(src16), u_errorName(err)); |
- return; |
- } |
- err = U_ZERO_ERROR; |
- uDestLen = -2; |
- u_strFromUTF32(uTarget, UPRV_LENGTHOF(src16)+1,&uDestLen,src32,UPRV_LENGTHOF(src32),&err); |
- if(err != U_ZERO_ERROR || uDestLen != UPRV_LENGTHOF(src16)) { |
- log_err("u_strFromUTF32(with length): " |
- "length %ld != %ld and %s != U_ZERO_ERROR\n", |
- (long)uDestLen, (long)UPRV_LENGTHOF(src16), u_errorName(err)); |
- return; |
- } |
- /*for(i=0; i< uDestLen; i++){ |
- printf("0x%04X, ",uTarget[i]); |
- if(i%10==0){ |
- printf("\n"); |
- } |
- }*/ |
- |
- for(i=0; i< uDestLen; i++){ |
- if(uTarget[i] != src16[i]){ |
- log_verbose("u_strFromUTF32(with length) failed expected: %04X got: %04X at index: %i \n", src16[i] ,uTarget[i],i); |
- } |
- } |
- if(uTarget[i] != 0){ |
- log_verbose("u_strFromUTF32(with length) failed expected: %04X got: %04X at index: %i \n", 0,uTarget[i],i); |
- } |
- |
- /* now NUL-terminated */ |
- uDestLen = -2; |
- u_strFromUTF32(NULL,0,&uDestLen,src32,-1,&err); |
- if(err != U_BUFFER_OVERFLOW_ERROR || uDestLen != UPRV_LENGTHOF(src16)-1) { |
- log_err("u_strFromUTF32(preflight with NUL-termination): " |
- "length %ld != %ld and %s != U_BUFFER_OVERFLOW_ERROR\n", |
- (long)uDestLen, (long)UPRV_LENGTHOF(src16)-1, u_errorName(err)); |
- return; |
- } |
- err = U_ZERO_ERROR; |
- uDestLen = -2; |
- u_strFromUTF32(uTarget, UPRV_LENGTHOF(src16),&uDestLen,src32,-1,&err); |
- if(err != U_ZERO_ERROR || uDestLen != UPRV_LENGTHOF(src16)-1) { |
- log_err("u_strFromUTF32(with NUL-termination): " |
- "length %ld != %ld and %s != U_ZERO_ERROR\n", |
- (long)uDestLen, (long)UPRV_LENGTHOF(src16)-1, u_errorName(err)); |
- return; |
- } |
- |
- for(i=0; i< uDestLen; i++){ |
- if(uTarget[i] != src16[i]){ |
- log_verbose("u_strFromUTF32(with NUL-termination) failed expected: %04X got: %04X \n", src16[i] ,uTarget[i]); |
- } |
- } |
-} |
- |
-/* test surrogate code points */ |
-static void Test_strFromUTF32_surrogates() { |
- UErrorCode err = U_ZERO_ERROR; |
- UChar uTarget[400]; |
- int32_t len32, uDestLen; |
- int32_t numSubstitutions; |
- int i; |
- |
- static const UChar32 surr32[] = { 0x41, 0xd900, 0x61, 0xdc00, -1, 0x110000, 0x5a, 0x50000, 0x7a, 0 }; |
- static const UChar expected[] = { 0x5a, 0xd900, 0xdc00, 0x7a, 0 }; |
- static const UChar expected_FFFD[] = { 0x41, 0xfffd, 0x61, 0xfffd, 0xfffd, 0xfffd, 0x5a, 0xd900, 0xdc00, 0x7a, 0 }; |
- static const UChar expected_12345[] = { 0x41, 0xd808, 0xdf45, 0x61, 0xd808, 0xdf45, 0xd808, 0xdf45, 0xd808, 0xdf45, |
- 0x5a, 0xd900, 0xdc00, 0x7a, 0 }; |
- len32 = UPRV_LENGTHOF(surr32); |
- for(i = 0; i < 6; ++i) { |
- err = U_ZERO_ERROR; |
- u_strFromUTF32(uTarget, 0, &uDestLen, surr32+i, len32-i, &err); |
- if(err != U_INVALID_CHAR_FOUND) { |
- log_err("u_strFromUTF32(preflight surr32+%ld) sets %s != U_INVALID_CHAR_FOUND\n", |
- (long)i, u_errorName(err)); |
- return; |
- } |
- |
- err = U_ZERO_ERROR; |
- u_strFromUTF32(uTarget, UPRV_LENGTHOF(uTarget), &uDestLen, surr32+i, len32-i, &err); |
- if(err != U_INVALID_CHAR_FOUND) { |
- log_err("u_strFromUTF32(surr32+%ld) sets %s != U_INVALID_CHAR_FOUND\n", |
- (long)i, u_errorName(err)); |
- return; |
- } |
- |
- err = U_ZERO_ERROR; |
- u_strFromUTF32(NULL, 0, &uDestLen, surr32+i, -1, &err); |
- if(err != U_INVALID_CHAR_FOUND) { |
- log_err("u_strFromUTF32(preflight surr32+%ld/NUL) sets %s != U_INVALID_CHAR_FOUND\n", |
- (long)i, u_errorName(err)); |
- return; |
- } |
- |
- err = U_ZERO_ERROR; |
- u_strFromUTF32(uTarget, UPRV_LENGTHOF(uTarget), &uDestLen, surr32+i, -1, &err); |
- if(err != U_INVALID_CHAR_FOUND) { |
- log_err("u_strFromUTF32(surr32+%ld/NUL) sets %s != U_INVALID_CHAR_FOUND\n", |
- (long)i, u_errorName(err)); |
- return; |
- } |
- } |
- |
- err = U_ZERO_ERROR; |
- u_strFromUTF32(uTarget, 0, &uDestLen, surr32+6, len32-6-1, &err); |
- if(err != U_BUFFER_OVERFLOW_ERROR || uDestLen != 4) { |
- log_err("u_strFromUTF32(preflight surr32+6) sets %s != U_BUFFER_OVERFLOW_ERROR or an unexpected length\n", |
- u_errorName(err)); |
- return; |
- } |
- |
- err = U_ZERO_ERROR; |
- u_strFromUTF32(uTarget, UPRV_LENGTHOF(uTarget), &uDestLen, surr32+6, len32-6-1, &err); |
- if(err != U_ZERO_ERROR || uDestLen != 4 || u_memcmp(uTarget, expected, 5)) { |
- log_err("u_strFromUTF32(surr32+6) sets %s != U_ZERO_ERROR or does not produce the expected string\n", |
- u_errorName(err)); |
- return; |
- } |
- |
- err = U_ZERO_ERROR; |
- u_strFromUTF32(NULL, 0, &uDestLen, surr32+6, -1, &err); |
- if(err != U_BUFFER_OVERFLOW_ERROR || uDestLen != 4) { |
- log_err("u_strFromUTF32(preflight surr32+6/NUL) sets %s != U_BUFFER_OVERFLOW_ERROR or an unexpected length\n", |
- u_errorName(err)); |
- return; |
- } |
- |
- err = U_ZERO_ERROR; |
- u_strFromUTF32(uTarget, UPRV_LENGTHOF(uTarget), &uDestLen, surr32+6, -1, &err); |
- if(err != U_ZERO_ERROR || uDestLen != 4 || u_memcmp(uTarget, expected, 5)) { |
- log_err("u_strFromUTF32(surr32+6/NUL) sets %s != U_ZERO_ERROR or does not produce the expected string\n", |
- u_errorName(err)); |
- return; |
- } |
- |
- /* with substitution character */ |
- numSubstitutions = -1; |
- err = U_ZERO_ERROR; |
- u_strFromUTF32WithSub(uTarget, 0, &uDestLen, surr32, len32-1, 0xfffd, &numSubstitutions, &err); |
- if(err != U_BUFFER_OVERFLOW_ERROR || uDestLen != 10 || numSubstitutions != 4) { |
- log_err("u_strFromUTF32WithSub(preflight surr32) sets %s != U_BUFFER_OVERFLOW_ERROR or an unexpected length\n", |
- u_errorName(err)); |
- return; |
- } |
- |
- err = U_ZERO_ERROR; |
- u_strFromUTF32WithSub(uTarget, UPRV_LENGTHOF(uTarget), &uDestLen, surr32, len32-1, 0xfffd, &numSubstitutions, &err); |
- if(err != U_ZERO_ERROR || uDestLen != 10 || numSubstitutions != 4 || u_memcmp(uTarget, expected_FFFD, 11)) { |
- log_err("u_strFromUTF32WithSub(surr32) sets %s != U_ZERO_ERROR or does not produce the expected string\n", |
- u_errorName(err)); |
- return; |
- } |
- |
- err = U_ZERO_ERROR; |
- u_strFromUTF32WithSub(NULL, 0, &uDestLen, surr32, -1, 0x12345, &numSubstitutions, &err); |
- if(err != U_BUFFER_OVERFLOW_ERROR || uDestLen != 14 || numSubstitutions != 4) { |
- log_err("u_strFromUTF32WithSub(preflight surr32/NUL) sets %s != U_BUFFER_OVERFLOW_ERROR or an unexpected length\n", |
- u_errorName(err)); |
- return; |
- } |
- |
- err = U_ZERO_ERROR; |
- u_strFromUTF32WithSub(uTarget, UPRV_LENGTHOF(uTarget), &uDestLen, surr32, -1, 0x12345, &numSubstitutions, &err); |
- if(err != U_ZERO_ERROR || uDestLen != 14 || numSubstitutions != 4 || u_memcmp(uTarget, expected_12345, 15)) { |
- log_err("u_strFromUTF32WithSub(surr32/NUL) sets %s != U_ZERO_ERROR or does not produce the expected string\n", |
- u_errorName(err)); |
- return; |
- } |
-} |
- |
-static void Test_UChar_UTF8_API(void){ |
- |
- UErrorCode err = U_ZERO_ERROR; |
- UChar uTemp[1]; |
- char u8Temp[1]; |
- UChar* uTarget=uTemp; |
- const char* u8Src; |
- int32_t u8SrcLen = 0; |
- int32_t uTargetLength = 0; |
- int32_t uDestLen=0; |
- const UChar* uSrc = src16; |
- int32_t uSrcLen = sizeof(src16)/2; |
- char* u8Target = u8Temp; |
- int32_t u8TargetLength =0; |
- int32_t u8DestLen =0; |
- UBool failed = FALSE; |
- int i= 0; |
- int32_t numSubstitutions; |
- |
- { |
- /* preflight */ |
- u8Temp[0] = 0x12; |
- u_strToUTF8(u8Target,u8TargetLength, &u8DestLen, uSrc, uSrcLen,&err); |
- if(err == U_BUFFER_OVERFLOW_ERROR && u8Temp[0] == 0x12){ |
- err = U_ZERO_ERROR; |
- u8Target = (char*) malloc (sizeof(uint8_t) * (u8DestLen+1)); |
- u8TargetLength = u8DestLen; |
- |
- u8Target[u8TargetLength] = (char)0xfe; |
- u8DestLen = -1; |
- u_strToUTF8(u8Target,u8TargetLength, &u8DestLen, uSrc, uSrcLen,&err); |
- if(U_FAILURE(err) || u8DestLen != u8TargetLength || u8Target[u8TargetLength] != (char)0xfe){ |
- log_err("u_strToUTF8 failed after preflight. Error: %s\n", u_errorName(err)); |
- return; |
- } |
- |
- } |
- else { |
- log_err("Should have gotten U_BUFFER_OVERFLOW_ERROR"); |
- } |
- failed = FALSE; |
- /*for(i=0; i< u8DestLen; i++){ |
- printf("0x%04X, ",u8Target[i]); |
- if(i%10==0){ |
- printf("\n"); |
- } |
- }*/ |
- /*for(i=0; i< u8DestLen; i++){ |
- if(u8Target[i] != src8[i]){ |
- log_verbose("u_strToUTF8() failed expected: %04X got: %04X \n", src8[i], u8Target[i]); |
- failed =TRUE; |
- } |
- } |
- if(failed){ |
- log_err("u_strToUTF8() failed \n"); |
- }*/ |
- u8Src = u8Target; |
- u8SrcLen = u8DestLen; |
- |
- /* preflight */ |
- uTemp[0] = 0x1234; |
- u_strFromUTF8(uTarget,uTargetLength,&uDestLen,u8Src,u8SrcLen,&err); |
- if(err == U_BUFFER_OVERFLOW_ERROR && uTemp[0] == 0x1234){ |
- err = U_ZERO_ERROR; |
- uTarget = (UChar*) malloc( sizeof(UChar) * (uDestLen+1)); |
- uTargetLength = uDestLen; |
- |
- uTarget[uTargetLength] = 0xfff0; |
- uDestLen = -1; |
- u_strFromUTF8(uTarget,uTargetLength,&uDestLen,u8Src,u8SrcLen,&err); |
- } |
- else { |
- log_err("error: u_strFromUTF8(preflight) should have gotten U_BUFFER_OVERFLOW_ERROR\n"); |
- } |
- /*for(i=0; i< uDestLen; i++){ |
- printf("0x%04X, ",uTarget[i]); |
- if(i%10==0){ |
- printf("\n"); |
- } |
- }*/ |
- |
- if(U_FAILURE(err) || uDestLen != uTargetLength || uTarget[uTargetLength] != 0xfff0) { |
- failed = TRUE; |
- } |
- for(i=0; i< uSrcLen; i++){ |
- if(uTarget[i] != src16[i]){ |
- log_verbose("u_strFromUTF8() failed expected: \\u%04X got: \\u%04X at index: %i \n", src16[i] ,uTarget[i],i); |
- failed =TRUE; |
- } |
- } |
- if(failed){ |
- log_err("error: u_strFromUTF8(after preflighting) failed\n"); |
- } |
- |
- free(u8Target); |
- free(uTarget); |
- } |
- { |
- u8SrcLen = -1; |
- uTargetLength = 0; |
- uSrcLen =-1; |
- u8TargetLength=0; |
- failed = FALSE; |
- /* preflight */ |
- u_strToUTF8(NULL,u8TargetLength, &u8DestLen, uSrc, uSrcLen,&err); |
- if(err == U_BUFFER_OVERFLOW_ERROR){ |
- err = U_ZERO_ERROR; |
- u8Target = (char*) malloc (sizeof(uint8_t) * (u8DestLen+1)); |
- u8TargetLength = u8DestLen; |
- |
- u_strToUTF8(u8Target,u8TargetLength, &u8DestLen, uSrc, uSrcLen,&err); |
- |
- } |
- else { |
- log_err("Should have gotten U_BUFFER_OVERFLOW_ERROR"); |
- } |
- failed = FALSE; |
- /*for(i=0; i< u8DestLen; i++){ |
- printf("0x%04X, ",u8Target[i]); |
- if(i%10==0){ |
- printf("\n"); |
- } |
- }*/ |
- /*for(i=0; i< u8DestLen; i++){ |
- if(u8Target[i] != src8[i]){ |
- log_verbose("u_strToUTF8() failed expected: %04X got: %04X \n", src8[i], u8Target[i]); |
- failed =TRUE; |
- } |
- } |
- if(failed){ |
- log_err("u_strToUTF8() failed \n"); |
- }*/ |
- u8Src = u8Target; |
- u8SrcLen = u8DestLen; |
- |
- /* preflight */ |
- u_strFromUTF8(NULL,uTargetLength,&uDestLen,u8Src,u8SrcLen,&err); |
- if(err == U_BUFFER_OVERFLOW_ERROR){ |
- err = U_ZERO_ERROR; |
- uTarget = (UChar*) malloc( sizeof(UChar) * (uDestLen+1)); |
- uTargetLength = uDestLen; |
- |
- u_strFromUTF8(uTarget,uTargetLength,&uDestLen,u8Src,u8SrcLen,&err); |
- } |
- else { |
- log_err("Should have gotten U_BUFFER_OVERFLOW_ERROR"); |
- } |
- /*for(i=0; i< uDestLen; i++){ |
- printf("0x%04X, ",uTarget[i]); |
- if(i%10==0){ |
- printf("\n"); |
- } |
- }*/ |
- |
- for(i=0; i< uSrcLen; i++){ |
- if(uTarget[i] != src16[i]){ |
- log_verbose("u_strFromUTF8() failed expected: \\u%04X got: \\u%04X at index: %i \n", src16[i] ,uTarget[i],i); |
- failed =TRUE; |
- } |
- } |
- if(failed){ |
- log_err("u_strToUTF8() failed \n"); |
- } |
- |
- free(u8Target); |
- free(uTarget); |
- } |
- |
- /* test UTF-8 with single surrogates - illegal in Unicode 3.2 */ |
- { |
- static const UChar |
- withLead16[]={ 0x1800, 0xd89a, 0x0061 }, |
- withTrail16[]={ 0x1800, 0xdcba, 0x0061, 0 }, |
- withTrail16SubFFFD[]={ 0x1800, 0xfffd, 0x0061, 0 }, /* sub==U+FFFD */ |
- withTrail16Sub50005[]={ 0x1800, 0xd900, 0xdc05, 0x0061, 0 }; /* sub==U+50005 */ |
- static const uint8_t |
- withLead8[]={ 0xe1, 0xa0, 0x80, 0xed, 0xa2, 0x9a, 0x61 }, |
- withTrail8[]={ 0xe1, 0xa0, 0x80, 0xed, 0xb2, 0xba, 0x61, 0 }, |
- withTrail8Sub1A[]={ 0xe1, 0xa0, 0x80, 0x1a, 0x61, 0 }, /* sub==U+001A */ |
- withTrail8SubFFFD[]={ 0xe1, 0xa0, 0x80, 0xef, 0xbf, 0xbd, 0x61, 0 }; /* sub==U+FFFD */ |
- UChar out16[10]; |
- char out8[10]; |
- |
- if( |
- (err=U_ZERO_ERROR, u_strToUTF8(out8, UPRV_LENGTHOF(out8), NULL, withLead16, UPRV_LENGTHOF(withLead16), &err), err!=U_INVALID_CHAR_FOUND) || |
- (err=U_ZERO_ERROR, u_strToUTF8(out8, UPRV_LENGTHOF(out8), NULL, withTrail16, -1, &err), err!=U_INVALID_CHAR_FOUND) || |
- (err=U_ZERO_ERROR, u_strFromUTF8(out16, UPRV_LENGTHOF(out16), NULL, (const char *)withLead8, UPRV_LENGTHOF(withLead8), &err), err!=U_INVALID_CHAR_FOUND) || |
- (err=U_ZERO_ERROR, u_strFromUTF8(out16, UPRV_LENGTHOF(out16), NULL, (const char *)withTrail8, -1, &err), err!=U_INVALID_CHAR_FOUND) |
- ) { |
- log_err("error: u_strTo/FromUTF8(string with single surrogate) fails to report error\n"); |
- } |
- |
- /* test error handling with substitution characters */ |
- |
- /* from UTF-8 with length */ |
- err=U_ZERO_ERROR; |
- numSubstitutions=-1; |
- out16[0]=0x55aa; |
- uDestLen=0; |
- u_strFromUTF8WithSub(out16, UPRV_LENGTHOF(out16), &uDestLen, |
- (const char *)withTrail8, uprv_strlen((const char *)withTrail8), |
- 0x50005, &numSubstitutions, |
- &err); |
- if(U_FAILURE(err) || uDestLen!=u_strlen(withTrail16Sub50005) || |
- 0!=u_memcmp(withTrail16Sub50005, out16, uDestLen+1) || |
- numSubstitutions!=1) { |
- log_err("error: u_strFromUTF8WithSub(length) failed\n"); |
- } |
- |
- /* from UTF-8 with NUL termination */ |
- err=U_ZERO_ERROR; |
- numSubstitutions=-1; |
- out16[0]=0x55aa; |
- uDestLen=0; |
- u_strFromUTF8WithSub(out16, UPRV_LENGTHOF(out16), &uDestLen, |
- (const char *)withTrail8, -1, |
- 0xfffd, &numSubstitutions, |
- &err); |
- if(U_FAILURE(err) || uDestLen!=u_strlen(withTrail16SubFFFD) || |
- 0!=u_memcmp(withTrail16SubFFFD, out16, uDestLen+1) || |
- numSubstitutions!=1) { |
- log_err("error: u_strFromUTF8WithSub(NUL termination) failed\n"); |
- } |
- |
- /* preflight from UTF-8 with NUL termination */ |
- err=U_ZERO_ERROR; |
- numSubstitutions=-1; |
- out16[0]=0x55aa; |
- uDestLen=0; |
- u_strFromUTF8WithSub(out16, 1, &uDestLen, |
- (const char *)withTrail8, -1, |
- 0x50005, &numSubstitutions, |
- &err); |
- if(err!=U_BUFFER_OVERFLOW_ERROR || uDestLen!=u_strlen(withTrail16Sub50005) || numSubstitutions!=1) { |
- log_err("error: u_strFromUTF8WithSub(preflight/NUL termination) failed\n"); |
- } |
- |
- /* to UTF-8 with length */ |
- err=U_ZERO_ERROR; |
- numSubstitutions=-1; |
- out8[0]=(char)0xf5; |
- u8DestLen=0; |
- u_strToUTF8WithSub(out8, UPRV_LENGTHOF(out8), &u8DestLen, |
- withTrail16, u_strlen(withTrail16), |
- 0xfffd, &numSubstitutions, |
- &err); |
- if(U_FAILURE(err) || u8DestLen!=uprv_strlen((const char *)withTrail8SubFFFD) || |
- 0!=uprv_memcmp((const char *)withTrail8SubFFFD, out8, u8DestLen+1) || |
- numSubstitutions!=1) { |
- log_err("error: u_strToUTF8WithSub(length) failed\n"); |
- } |
- |
- /* to UTF-8 with NUL termination */ |
- err=U_ZERO_ERROR; |
- numSubstitutions=-1; |
- out8[0]=(char)0xf5; |
- u8DestLen=0; |
- u_strToUTF8WithSub(out8, UPRV_LENGTHOF(out8), &u8DestLen, |
- withTrail16, -1, |
- 0x1a, &numSubstitutions, |
- &err); |
- if(U_FAILURE(err) || u8DestLen!=uprv_strlen((const char *)withTrail8Sub1A) || |
- 0!=uprv_memcmp((const char *)withTrail8Sub1A, out8, u8DestLen+1) || |
- numSubstitutions!=1) { |
- log_err("error: u_strToUTF8WithSub(NUL termination) failed\n"); |
- } |
- |
- /* preflight to UTF-8 with NUL termination */ |
- err=U_ZERO_ERROR; |
- numSubstitutions=-1; |
- out8[0]=(char)0xf5; |
- u8DestLen=0; |
- u_strToUTF8WithSub(out8, 1, &u8DestLen, |
- withTrail16, -1, |
- 0xfffd, &numSubstitutions, |
- &err); |
- if(err!=U_BUFFER_OVERFLOW_ERROR || u8DestLen!=uprv_strlen((const char *)withTrail8SubFFFD) || |
- numSubstitutions!=1) { |
- log_err("error: u_strToUTF8WithSub(preflight/NUL termination) failed\n"); |
- } |
- |
- /* test that numSubstitutions==0 if there are no substitutions */ |
- |
- /* from UTF-8 with length (just first 3 bytes which are valid) */ |
- err=U_ZERO_ERROR; |
- numSubstitutions=-1; |
- out16[0]=0x55aa; |
- uDestLen=0; |
- u_strFromUTF8WithSub(out16, UPRV_LENGTHOF(out16), &uDestLen, |
- (const char *)withTrail8, 3, |
- 0x50005, &numSubstitutions, |
- &err); |
- if(U_FAILURE(err) || uDestLen!=1 || |
- 0!=u_memcmp(withTrail16Sub50005, out16, uDestLen) || |
- numSubstitutions!=0) { |
- log_err("error: u_strFromUTF8WithSub(no subs) failed\n"); |
- } |
- |
- /* to UTF-8 with length (just first UChar which is valid) */ |
- err=U_ZERO_ERROR; |
- numSubstitutions=-1; |
- out8[0]=(char)0xf5; |
- u8DestLen=0; |
- u_strToUTF8WithSub(out8, UPRV_LENGTHOF(out8), &u8DestLen, |
- withTrail16, 1, |
- 0xfffd, &numSubstitutions, |
- &err); |
- if(U_FAILURE(err) || u8DestLen!=3 || |
- 0!=uprv_memcmp((const char *)withTrail8SubFFFD, out8, u8DestLen) || |
- numSubstitutions!=0) { |
- log_err("error: u_strToUTF8WithSub(no subs) failed\n"); |
- } |
- |
- /* test that numSubstitutions==0 if subchar==U_SENTINEL (no subchar) */ |
- |
- /* from UTF-8 with length (just first 3 bytes which are valid) */ |
- err=U_ZERO_ERROR; |
- numSubstitutions=-1; |
- out16[0]=0x55aa; |
- uDestLen=0; |
- u_strFromUTF8WithSub(out16, UPRV_LENGTHOF(out16), &uDestLen, |
- (const char *)withTrail8, 3, |
- U_SENTINEL, &numSubstitutions, |
- &err); |
- if(U_FAILURE(err) || uDestLen!=1 || |
- 0!=u_memcmp(withTrail16Sub50005, out16, uDestLen) || |
- numSubstitutions!=0) { |
- log_err("error: u_strFromUTF8WithSub(no subchar) failed\n"); |
- } |
- |
- /* to UTF-8 with length (just first UChar which is valid) */ |
- err=U_ZERO_ERROR; |
- numSubstitutions=-1; |
- out8[0]=(char)0xf5; |
- u8DestLen=0; |
- u_strToUTF8WithSub(out8, UPRV_LENGTHOF(out8), &u8DestLen, |
- withTrail16, 1, |
- U_SENTINEL, &numSubstitutions, |
- &err); |
- if(U_FAILURE(err) || u8DestLen!=3 || |
- 0!=uprv_memcmp((const char *)withTrail8SubFFFD, out8, u8DestLen) || |
- numSubstitutions!=0) { |
- log_err("error: u_strToUTF8WithSub(no subchar) failed\n"); |
- } |
- } |
- { |
- /* |
- * Test with an illegal lead byte that would be followed by more than 3 trail bytes. |
- * See ticket #10371. |
- */ |
- static const char src[1]={ (char)0xf8 }; |
- UChar out16[10]; |
- err=U_ZERO_ERROR; |
- u_strFromUTF8(out16, UPRV_LENGTHOF(out16), NULL, src, 1, &err); |
- if(err!=U_INVALID_CHAR_FOUND) { |
- log_err("error: u_strFromUTF8(5-byte lead byte) failed\n"); |
- } |
- } |
-} |
- |
-/* |
- * Returns TRUE if the first length UChars of s and t agree, where a 0xfffd |
- * in t acts as a wildcard that matches whatever s has at the same index. |
- * A length of zero or less always yields TRUE. |
- */ |
-static UBool |
-equalAnyFFFD(const UChar *s, const UChar *t, int32_t length) { |
-    int32_t idx; |
- |
-    for(idx=0; idx<length; ++idx) { |
-        const UChar wanted=t[idx]; |
-        if(wanted==0xfffd || wanted==s[idx]) { |
-            continue; |
-        } |
-        return FALSE; |
-    } |
-    return TRUE; |
-} |
- |
-/* |
- * test u_strFromUTF8() |
- * |
- * Preflights one 3-byte UTF-8 sequence (with explicit lengths 3 and 4, and as a |
- * NUL-terminated string) and then converts it into a real buffer, checking the |
- * returned pointer, the reported length, the error code and the output. |
- */ |
-static void |
-Test_FromUTF8(void) { |
- /* |
- * Test case from icu-support list 20071130 "u_strFromUTF8() returns U_INVALID_CHAR_FOUND(10)" |
- */ |
- static const uint8_t bytes[]={ 0xe0, 0xa5, 0x9c, 0 }; |
- UChar dest[64]; |
- UChar *destPointer; |
- int32_t destLength; |
- UErrorCode errorCode; |
- |
- /* destLength is preset to -99 before each call so that a call which does not write it is detected */ |
- |
- /* 3 bytes input, one UChar output (U+095C) */ |
- errorCode=U_ZERO_ERROR; |
- destLength=-99; |
- destPointer=u_strFromUTF8(NULL, 0, &destLength, (const char *)bytes, 3, &errorCode); |
- if(errorCode!=U_BUFFER_OVERFLOW_ERROR || destPointer!=NULL || destLength!=1) { |
- log_err("error: u_strFromUTF8(preflight srcLength=3) fails: destLength=%ld - %s\n", |
- (long)destLength, u_errorName(errorCode)); |
- } |
- |
- /* 4 bytes input, two UChars output (U+095C U+0000) */ |
- errorCode=U_ZERO_ERROR; |
- destLength=-99; |
- destPointer=u_strFromUTF8(NULL, 0, &destLength, (const char *)bytes, 4, &errorCode); |
- if(errorCode!=U_BUFFER_OVERFLOW_ERROR || destPointer!=NULL || destLength!=2) { |
- log_err("error: u_strFromUTF8(preflight srcLength=4) fails: destLength=%ld - %s\n", |
- (long)destLength, u_errorName(errorCode)); |
- } |
- |
- /* NUL-terminated 3 bytes input, one UChar output (U+095C) */ |
- errorCode=U_ZERO_ERROR; |
- destLength=-99; |
- destPointer=u_strFromUTF8(NULL, 0, &destLength, (const char *)bytes, -1, &errorCode); |
- if(errorCode!=U_BUFFER_OVERFLOW_ERROR || destPointer!=NULL || destLength!=1) { |
- log_err("error: u_strFromUTF8(preflight srcLength=-1) fails: destLength=%ld - %s\n", |
- (long)destLength, u_errorName(errorCode)); |
- } |
- |
- /* 3 bytes input, one UChar output (U+095C), transform not just preflight */ |
- errorCode=U_ZERO_ERROR; |
- /* non-zero sentinels: dest[1] must be overwritten with the NUL terminator */ |
- dest[0]=dest[1]=99; |
- destLength=-99; |
- destPointer=u_strFromUTF8(dest, UPRV_LENGTHOF(dest), &destLength, (const char *)bytes, 3, &errorCode); |
- if(U_FAILURE(errorCode) || destPointer!=dest || destLength!=1 || dest[0]!=0x95c || dest[1]!=0) { |
- log_err("error: u_strFromUTF8(transform srcLength=3) fails: destLength=%ld - %s\n", |
- (long)destLength, u_errorName(errorCode)); |
- } |
-} |
- |
-/* |
- * test u_strFromUTF8Lenient() |
- * |
- * First checks the handling of illegal arguments, then walks two parallel |
- * tables (UTF-8 inputs and expected UTF-16 outputs) and, for every string, |
- * exercises preflighting and conversion with both NUL-terminated (-1) and |
- * explicit-length input and with several destination capacities. |
- */ |
-static void |
-Test_FromUTF8Lenient(void) { |
- /* |
- * Multiple input strings, each NUL-terminated. |
- * Terminate with a string starting with 0xff. |
- */ |
- static const uint8_t bytes[]={ |
- /* well-formed UTF-8 */ |
- 0x61, 0xc3, 0x9f, 0xe0, 0xa0, 0x80, 0xf0, 0xa0, 0x80, 0x80, |
- 0x62, 0xc3, 0xa0, 0xe0, 0xa0, 0x81, 0xf0, 0xa0, 0x80, 0x81, 0, |
- |
- /* various malformed sequences */ |
- 0xc3, 0xc3, 0x9f, 0xc3, 0xa0, 0xe0, 0x80, 0x8a, 0xf0, 0x41, 0x42, 0x43, 0, |
- |
- /* truncated input */ |
- 0xc3, 0, |
- 0xe0, 0, |
- 0xe0, 0xa0, 0, |
- 0xf0, 0, |
- 0xf0, 0x90, 0, |
- 0xf0, 0x90, 0x80, 0, |
- |
- /* non-ASCII characters in the last few bytes */ |
- 0x61, 0xc3, 0x9f, 0xe0, 0xa0, 0x80, 0, |
- 0x61, 0xe0, 0xa0, 0x80, 0xc3, 0x9f, 0, |
- |
- /* empty string */ |
- 0, |
- |
- /* finish */ |
- 0xff, 0 |
- }; |
- |
- /* Multiple output strings, each NUL-terminated. 0xfffd matches anything. */ |
- static const UChar uchars[]={ |
- 0x61, 0xdf, 0x800, 0xd840, 0xdc00, |
- 0x62, 0xe0, 0x801, 0xd840, 0xdc01, 0, |
- |
- 0xfffd, 0x9f, 0xe0, 0xa, 0xfffd, 0xfffd, 0, |
- |
- 0xfffd, 0, |
- 0xfffd, 0, |
- 0xfffd, 0, |
- 0xfffd, 0, |
- 0xfffd, 0, |
- 0xfffd, 0, |
- |
- 0x61, 0xdf, 0x800, 0, |
- 0x61, 0x800, 0xdf, 0, |
- |
- 0, |
- |
- 0 |
- }; |
- |
- UChar dest[64]; |
- const char *pb; |
- const UChar *pu, *pDest; |
- int32_t srcLength, destLength0, destLength; |
- int number; |
- UErrorCode errorCode; |
- |
- /* verify checking for some illegal arguments */ |
- /* dest[0] is preset to 0x1234 before each call; it must stay untouched when the call is rejected */ |
- dest[0]=0x1234; |
- destLength=-1; |
- errorCode=U_ZERO_ERROR; |
- pDest=u_strFromUTF8Lenient(dest, 1, &destLength, NULL, -1, &errorCode); |
- if(errorCode!=U_ILLEGAL_ARGUMENT_ERROR || dest[0]!=0x1234) { |
- log_err("u_strFromUTF8Lenient(src=NULL) failed\n"); |
- } |
- |
- dest[0]=0x1234; |
- destLength=-1; |
- errorCode=U_ZERO_ERROR; |
- pDest=u_strFromUTF8Lenient(NULL, 1, &destLength, (const char *)bytes, -1, &errorCode); |
- if(errorCode!=U_ILLEGAL_ARGUMENT_ERROR) { |
- log_err("u_strFromUTF8Lenient(dest=NULL[1]) failed\n"); |
- } |
- |
- /* an error code that is already a failure on entry must be left as it is */ |
- dest[0]=0x1234; |
- destLength=-1; |
- errorCode=U_MEMORY_ALLOCATION_ERROR; |
- pDest=u_strFromUTF8Lenient(dest, 1, &destLength, (const char *)bytes, -1, &errorCode); |
- if(errorCode!=U_MEMORY_ALLOCATION_ERROR || dest[0]!=0x1234) { |
- log_err("u_strFromUTF8Lenient(U_MEMORY_ALLOCATION_ERROR) failed\n"); |
- } |
- |
- /* pErrorCode==NULL: errorCode is not passed to this call; only the untouched dest[0] is checked */ |
- dest[0]=0x1234; |
- destLength=-1; |
- errorCode=U_MEMORY_ALLOCATION_ERROR; |
- pDest=u_strFromUTF8Lenient(dest, 1, &destLength, (const char *)bytes, -1, NULL); |
- if(dest[0]!=0x1234) { |
- log_err("u_strFromUTF8Lenient(pErrorCode=NULL) failed\n"); |
- } |
- |
- /* test normal behavior */ |
- number=0; /* string number for log_err() */ |
- |
- /* |
- * pb and pu walk bytes[] and uchars[] in parallel; after each iteration both |
- * skip the current string plus its NUL. The loop ends at the 0xff marker. |
- */ |
- for(pb=(const char *)bytes, pu=uchars; |
- *pb!=(char)0xff; |
- pb+=srcLength+1, pu+=destLength0+1, ++number |
- ) { |
- srcLength=uprv_strlen(pb); |
- destLength0=u_strlen(pu); |
- |
- /* preflighting with NUL-termination */ |
- dest[0]=0x1234; |
- destLength=-1; |
- errorCode=U_ZERO_ERROR; |
- pDest=u_strFromUTF8Lenient(NULL, 0, &destLength, pb, -1, &errorCode); |
- /* for the empty string the test expects the not-terminated warning instead of an overflow */ |
- if (errorCode!= (destLength0==0 ? U_STRING_NOT_TERMINATED_WARNING : U_BUFFER_OVERFLOW_ERROR) || |
- pDest!=NULL || dest[0]!=0x1234 || destLength!=destLength0 |
- ) { |
- log_err("u_strFromUTF8Lenient(%d preflighting with NUL-termination) failed\n", number); |
- } |
- |
- /* preflighting/some capacity with NUL-termination */ |
- if(srcLength>0) { |
- /* capacity is one short: the UChar just past the capacity must not be written */ |
- dest[destLength0-1]=0x1234; |
- destLength=-1; |
- errorCode=U_ZERO_ERROR; |
- pDest=u_strFromUTF8Lenient(dest, destLength0-1, &destLength, pb, -1, &errorCode); |
- if (errorCode!=U_BUFFER_OVERFLOW_ERROR || |
- dest[destLength0-1]!=0x1234 || destLength!=destLength0 |
- ) { |
- log_err("u_strFromUTF8Lenient(%d preflighting/some capacity with NUL-termination) failed\n", number); |
- } |
- } |
- |
- /* conversion with NUL-termination, much capacity */ |
- dest[0]=dest[destLength0]=0x1234; |
- destLength=-1; |
- errorCode=U_ZERO_ERROR; |
- pDest=u_strFromUTF8Lenient(dest, UPRV_LENGTHOF(dest), &destLength, pb, -1, &errorCode); |
- if (errorCode!=U_ZERO_ERROR || |
- pDest!=dest || dest[destLength0]!=0 || |
- destLength!=destLength0 || !equalAnyFFFD(dest, pu, destLength) |
- ) { |
- log_err("u_strFromUTF8Lenient(%d conversion with NUL-termination, much capacity) failed\n", number); |
- } |
- |
- /* conversion with NUL-termination, exact capacity */ |
- dest[0]=dest[destLength0]=0x1234; |
- destLength=-1; |
- errorCode=U_ZERO_ERROR; |
- pDest=u_strFromUTF8Lenient(dest, destLength0, &destLength, pb, -1, &errorCode); |
- if (errorCode!=U_STRING_NOT_TERMINATED_WARNING || |
- pDest!=dest || dest[destLength0]!=0x1234 || |
- destLength!=destLength0 || !equalAnyFFFD(dest, pu, destLength) |
- ) { |
- log_err("u_strFromUTF8Lenient(%d conversion with NUL-termination, exact capacity) failed\n", number); |
- } |
- |
- /* preflighting with length */ |
- dest[0]=0x1234; |
- destLength=-1; |
- errorCode=U_ZERO_ERROR; |
- pDest=u_strFromUTF8Lenient(NULL, 0, &destLength, pb, srcLength, &errorCode); |
- /* with an explicit source length the reported length is compared with srcLength, not destLength0 */ |
- if (errorCode!= (destLength0==0 ? U_STRING_NOT_TERMINATED_WARNING : U_BUFFER_OVERFLOW_ERROR) || |
- pDest!=NULL || dest[0]!=0x1234 || destLength!=srcLength |
- ) { |
- log_err("u_strFromUTF8Lenient(%d preflighting with length) failed\n", number); |
- } |
- |
- /* preflighting/some capacity with length */ |
- if(srcLength>0) { |
- dest[srcLength-1]=0x1234; |
- destLength=-1; |
- errorCode=U_ZERO_ERROR; |
- pDest=u_strFromUTF8Lenient(dest, srcLength-1, &destLength, pb, srcLength, &errorCode); |
- if (errorCode!=U_BUFFER_OVERFLOW_ERROR || |
- dest[srcLength-1]!=0x1234 || destLength!=srcLength |
- ) { |
- log_err("u_strFromUTF8Lenient(%d preflighting/some capacity with length) failed\n", number); |
- } |
- } |
- |
- /* conversion with length, much capacity */ |
- dest[0]=dest[destLength0]=0x1234; |
- destLength=-1; |
- errorCode=U_ZERO_ERROR; |
- pDest=u_strFromUTF8Lenient(dest, UPRV_LENGTHOF(dest), &destLength, pb, srcLength, &errorCode); |
- if (errorCode!=U_ZERO_ERROR || |
- pDest!=dest || dest[destLength0]!=0 || |
- destLength!=destLength0 || !equalAnyFFFD(dest, pu, destLength) |
- ) { |
- log_err("u_strFromUTF8Lenient(%d conversion with length, much capacity) failed\n", number); |
- } |
- |
- /* conversion with length, srcLength capacity */ |
- dest[0]=dest[srcLength]=dest[destLength0]=0x1234; |
- destLength=-1; |
- errorCode=U_ZERO_ERROR; |
- pDest=u_strFromUTF8Lenient(dest, srcLength, &destLength, pb, srcLength, &errorCode); |
- /* the output fills the capacity exactly only when it is as long as the input; then no NUL fits */ |
- if(srcLength==destLength0) { |
- if (errorCode!=U_STRING_NOT_TERMINATED_WARNING || |
- pDest!=dest || dest[destLength0]!=0x1234 || |
- destLength!=destLength0 || !equalAnyFFFD(dest, pu, destLength) |
- ) { |
- log_err("u_strFromUTF8Lenient(%d conversion with length, srcLength capacity/not terminated) failed\n", number); |
- } |
- } else { |
- if (errorCode!=U_ZERO_ERROR || |
- pDest!=dest || dest[destLength0]!=0 || |
- destLength!=destLength0 || !equalAnyFFFD(dest, pu, destLength) |
- ) { |
- log_err("u_strFromUTF8Lenient(%d conversion with length, srcLength capacity/terminated) failed\n", number); |
- } |
- } |
- } |
-} |
- |
-/* |
- * NUL-terminated UTF-16 input used below by Test_UChar_WCHART_API(): |
- * four lines of eight ASCII capital letters (C-J, K-R, S-Z and S-Z again), |
- * each line followed by CR LF. |
- */ |
-static const uint16_t src16j[] = { |
- 0x0043, 0x0044, 0x0045, 0x0046, 0x0047, 0x0048, 0x0049, 0x004A, 0x000D, 0x000A, |
- 0x004B, 0x004C, 0x004D, 0x004E, 0x004F, 0x0050, 0x0051, 0x0052, 0x000D, 0x000A, |
- 0x0053, 0x0054, 0x0055, 0x0056, 0x0057, 0x0058, 0x0059, 0x005A, 0x000D, 0x000A, |
- 0x0053, 0x0054, 0x0055, 0x0056, 0x0057, 0x0058, 0x0059, 0x005A, 0x000D, 0x000A, |
- 0x0000, |
- /* Test only ASCII */ |
- |
-}; |
-/* |
- * UTF-16 input with embedded NULs, used below by Test_UChar_WCHART_API(): |
- * eight runs of five ASCII code units, each run followed by U+0000. |
- * The non-ASCII values at the end are commented out and not part of the data. |
- */ |
-static const uint16_t src16WithNulls[] = { |
- 0x0043, 0x0044, 0x0045, 0x0046, 0x0047, 0x0000, |
- 0x0048, 0x0049, 0x004A, 0x000D, 0x000A, 0x0000, |
- 0x004B, 0x004C, 0x004D, 0x004E, 0x004F, 0x0000, |
- 0x0050, 0x0051, 0x0052, 0x000D, 0x000A, 0x0000, |
- 0x0053, 0x0054, 0x0055, 0x0056, 0x0057, 0x0000, |
- 0x0058, 0x0059, 0x005A, 0x000D, 0x000A, 0x0000, |
- 0x0053, 0x0054, 0x0055, 0x0056, 0x0057, 0x0000, |
- 0x0058, 0x0059, 0x005A, 0x000D, 0x000A, 0x0000, |
- /* test only ASCII */ |
- /* |
- 0x00A8, 0x00A9, 0x00AA, 0x00AB, 0x00AC, 0x00AD, |
- 0x00AE, 0x00AF, 0x00B0, 0x00B1, 0x00B2, 0x00B3, 0x00B4, 0x00B5, 0x00B6, 0x00B7, |
- 0x00B8, 0x00B9, 0x00BA, 0x00BB, 0x00BC, 0x00BD, 0x00BE, 0x00BF, 0x00C0, 0x00C1, |
- 0x00C2, 0x00C3, 0x00C4, 0x00C5, 0x00C6, 0x00C7, 0x00C8, 0x00C9, 0x00CA, 0x00CB, |
- 0x00CC, 0x00CD, 0x00CE, 0x00CF, 0x00D0, 0x00D1, 0x00D2, 0x00D3, 0x00D4, 0x00D5, |
- 0x00D6, 0x00D7, 0x00D8, 0x00D9, 0x00DA, 0x00DB, 0x00DC, 0x00DD, 0x00DE, 0x00DF, |
- 0x00E0, 0x00E1, 0x00E2, 0x00E3, 0x00E4, 0x00E5, 0x00E6, 0x00E7, 0x00E8, 0x00E9, |
- 0x0054, 0x0000 */ |
- |
-}; |
-#if (defined(U_WCHAR_IS_UTF16) || defined(U_WCHAR_IS_UTF32)) || (!UCONFIG_NO_CONVERSION && !UCONFIG_NO_LEGACY_CONVERSION) |
-/* |
- * Helper for Test_UChar_WCHART_API(): converts src to wchar_t with u_strToWCS() |
- * and back to UTF-16 with u_strFromWCS(), preflighting each direction to size |
- * its buffer, and compares the result with the original. |
- * |
- * Every call starts from a fresh error code and failure flag, so one failing |
- * round trip does not make the following ones report failures as well. |
- * |
- * src          UTF-16 input |
- * srcCount     number of UChars of src that are compared with the result; |
- *              callers include the final NUL so that the terminator is checked too |
- * srcLength    length handed to u_strToWCS(); with -1 (NUL-terminated) the |
- *              wchar_t string is handed back to u_strFromWCS() with -1 as well |
- * description  inserted into the verbose mismatch message |
- */ |
-static void |
-roundTripWCS(const UChar *src, int32_t srcCount, int32_t srcLength, const char *description) { |
-    UErrorCode err = U_ZERO_ERROR; |
-    wchar_t *wDest = NULL; |
-    UChar *uDest = NULL; |
-    int32_t wLen = 0; |
-    int32_t wSrcLength; |
-    int32_t uLen = 0; |
-    int32_t i; |
-    UBool failed = FALSE; |
- |
-    /* pre-flight */ |
-    u_strToWCS(NULL, 0, &wLen, src, srcLength, &err); |
-    if(err == U_BUFFER_OVERFLOW_ERROR){ |
-        err = U_ZERO_ERROR; |
-        wDest = (wchar_t*) malloc(sizeof(wchar_t) * (wLen+1)); |
-        if(wDest == NULL){ |
-            log_err("u_strToWCS() test: malloc failed for %d wchar_ts\n", (int)(wLen+1)); |
-            return; |
-        } |
-        u_strToWCS(wDest, wLen+1, &wLen, src, srcLength, &err); |
-    } |
- |
-    /* |
-     * Keep the wchar_t length in its own variable: the pre-flight below stores |
-     * the UTF-16 length, which must not be reused as the wchar_t source length. |
-     */ |
-    wSrcLength = (srcLength < 0) ? -1 : wLen; |
- |
-    /* pre-flight */ |
-    u_strFromWCS(NULL, 0, &uLen, wDest, wSrcLength, &err); |
-    if(err == U_BUFFER_OVERFLOW_ERROR){ |
-        err = U_ZERO_ERROR; |
-        uDest = (UChar*) malloc(sizeof(UChar) * (uLen+1)); |
-        if(uDest == NULL){ |
-            log_err("u_strFromWCS() test: malloc failed for %d UChars\n", (int)(uLen+1)); |
-            free(wDest); |
-            return; |
-        } |
-        u_strFromWCS(uDest, uLen+1, &uLen, wDest, wSrcLength, &err); |
-    } |
- |
-    if(U_FAILURE(err)){ |
-        log_err("u_strFromWCS() failed. Error: %s \n", u_errorName(err)); |
-    } else { |
-        if(uDest == NULL || uLen+1 < srcCount){ |
-            /* nothing, or too little, came back: do not read past the buffer */ |
-            log_verbose("u_str*WCS() failed for %s expected length: %d got: %d \n", |
-                        description, (int)(srcCount-1), (int)uLen); |
-            failed = TRUE; |
-        } else { |
-            for(i=0; i< srcCount; i++){ |
-                if(uDest[i] != src[i]){ |
-                    log_verbose("u_str*WCS() failed for %s expected: \\u%04X got: \\u%04X at index: %i \n", description, src[i] ,uDest[i],i); |
-                    failed =TRUE; |
-                } |
-            } |
-        } |
-        if(failed){ |
-            log_err("u_strToWCS() failed \n"); |
-        } |
-    } |
-    free(wDest); |
-    free(uDest); |
-} |
-#endif |
- |
-/* |
- * Tests u_strToWCS(), u_strFromWCS() and u_terminateWChars(): |
- * bad-argument handling, three UTF-16 -> wchar_t -> UTF-16 round trips |
- * (explicit length, embedded NULs, NUL-terminated), and string termination |
- * with various capacities. |
- */ |
-static void Test_UChar_WCHART_API(void){ |
-#if (defined(U_WCHAR_IS_UTF16) || defined(U_WCHAR_IS_UTF32)) || (!UCONFIG_NO_CONVERSION && !UCONFIG_NO_LEGACY_CONVERSION) |
-    UErrorCode err = U_ZERO_ERROR; |
-    int32_t wDestLen = 0; |
- |
-    { |
-        /* Bad UErrorCode arguments. Make sure that the API doesn't crash, and that Purify doesn't complain. */ |
-        if (u_strFromWCS(NULL,0,NULL,NULL,0,NULL) != NULL) { |
-            log_err("u_strFromWCS() should return NULL with a bad argument\n"); |
-        } |
-        if (u_strToWCS(NULL,0,NULL,NULL,0,NULL) != NULL) { |
-            log_err("u_strToWCS() should return NULL with a bad argument\n"); |
-        } |
- |
-        /* NULL source & destination. */ |
-        err = U_ZERO_ERROR; |
-        u_strFromWCS(NULL,0,NULL,NULL,0,&err); |
-        if (err != U_STRING_NOT_TERMINATED_WARNING) { |
-            log_err("u_strFromWCS(NULL, NULL) failed. Error: %s \n", u_errorName(err)); |
-        } |
-        err = U_ZERO_ERROR; |
-        u_strToWCS(NULL,0,NULL,NULL,0,&err); |
-        if (err != U_STRING_NOT_TERMINATED_WARNING) { |
-            log_err("u_strToWCS(NULL, NULL) failed. Error: %s \n", u_errorName(err)); |
-        } |
-    } |
- |
-    /* explicit length: everything except the final NUL is converted */ |
-    roundTripWCS(src16j, UPRV_LENGTHOF(src16j), UPRV_LENGTHOF(src16j)-1, "unterminated string"); |
- |
-    /* test with embedded nulls */ |
-    roundTripWCS(src16WithNulls, UPRV_LENGTHOF(src16WithNulls), UPRV_LENGTHOF(src16WithNulls)-1, "string with nulls"); |
- |
-    /* NUL-terminated in both directions */ |
-    roundTripWCS(src16j, UPRV_LENGTHOF(src16j), -1, "null terminated string"); |
- |
-    /* |
-     * Test u_terminateWChars(). |
-     * All u_terminateXYZ() use the same implementation macro; |
-     * we test this function to improve API coverage. |
-     */ |
-    { |
-        wchar_t buffer[10]; |
- |
-        /* room for the NUL: terminated, no warning */ |
-        err=U_ZERO_ERROR; |
-        buffer[3]=0x20ac; |
-        wDestLen=u_terminateWChars(buffer, UPRV_LENGTHOF(buffer), 3, &err); |
-        if(err!=U_ZERO_ERROR || wDestLen!=3 || buffer[3]!=0) { |
-            log_err("u_terminateWChars(buffer, all, 3, zero) failed: %s length %d [3]==U+%04x\n", |
-                    u_errorName(err), wDestLen, buffer[3]); |
-        } |
- |
-        /* capacity equals length: warning, buffer[3] untouched */ |
-        err=U_ZERO_ERROR; |
-        buffer[3]=0x20ac; |
-        wDestLen=u_terminateWChars(buffer, 3, 3, &err); |
-        if(err!=U_STRING_NOT_TERMINATED_WARNING || wDestLen!=3 || buffer[3]!=0x20ac) { |
-            log_err("u_terminateWChars(buffer, 3, 3, zero) failed: %s length %d [3]==U+%04x\n", |
-                    u_errorName(err), wDestLen, buffer[3]); |
-        } |
- |
-        /* a stale not-terminated warning must be cleared when the NUL fits */ |
-        err=U_STRING_NOT_TERMINATED_WARNING; |
-        buffer[3]=0x20ac; |
-        wDestLen=u_terminateWChars(buffer, UPRV_LENGTHOF(buffer), 3, &err); |
-        if(err!=U_ZERO_ERROR || wDestLen!=3 || buffer[3]!=0) { |
-            log_err("u_terminateWChars(buffer, all, 3, not-terminated) failed: %s length %d [3]==U+%04x\n", |
-                    u_errorName(err), wDestLen, buffer[3]); |
-        } |
- |
-        /* capacity smaller than length: overflow, buffer[3] untouched */ |
-        err=U_ZERO_ERROR; |
-        buffer[3]=0x20ac; |
-        wDestLen=u_terminateWChars(buffer, 2, 3, &err); |
-        if(err!=U_BUFFER_OVERFLOW_ERROR || wDestLen!=3 || buffer[3]!=0x20ac) { |
-            log_err("u_terminateWChars(buffer, 2, 3, zero) failed: %s length %d [3]==U+%04x\n", |
-                    u_errorName(err), wDestLen, buffer[3]); |
-        } |
-    } |
-#else |
-    log_info("Not testing u_str*WCS because (!UCONFIG_NO_CONVERSION && !UCONFIG_NO_LEGACY_CONVERSION) and wchar is neither utf16 nor utf32"); |
-#endif |
-} |
- |
-/* |
- * Converts the string "hello" to wchar_t with u_strToWCS() and back with |
- * u_strFromWCS(), checking that both calls succeed and keep the length. |
- * |
- * A failed conversion ends the test right away: after a failure the returned |
- * pointer and the output length are not usable for the remaining checks. |
- */ |
-static void Test_widestrs(void) |
-{ |
-#if (defined(U_WCHAR_IS_UTF16) || defined(U_WCHAR_IS_UTF32)) || (!UCONFIG_NO_CONVERSION && !UCONFIG_NO_LEGACY_CONVERSION) |
-    wchar_t ws[100]; |
-    UChar rts[100]; |
-    int32_t wcap = sizeof(ws) / sizeof(*ws); |
-    int32_t wl = 0; |
-    int32_t rtcap = sizeof(rts) / sizeof(*rts); |
-    int32_t rtl = 0; |
-    wchar_t *wcs; |
-    UChar ustr[] = {'h', 'e', 'l', 'l', 'o', 0}; |
-    int32_t ul = sizeof(ustr)/sizeof(*ustr) -1; |
-    char astr[100]; |
-    UErrorCode err; |
- |
-    err = U_ZERO_ERROR; |
-    wcs = u_strToWCS(ws, wcap, &wl, ustr, ul, &err); |
-    if (U_FAILURE(err) || wcs == NULL) { |
-        log_err("test_widestrs: u_strToWCS error: %s!\n", u_errorName(err)); |
-        return; /* wcs must not be passed to uprv_wcslen() below */ |
-    } |
-    if(ul!=wl){ |
-        log_err("u_strToWCS: ustr = %s, ul = %d, ws = %S, wl = %d!\n", u_austrcpy(astr, ustr), ul, ws, wl); |
-    } |
- |
-    err = U_ZERO_ERROR; |
-    wl = (int32_t)uprv_wcslen(wcs); |
-    u_strFromWCS(rts, rtcap, &rtl, wcs, wl, &err); |
-    if (U_FAILURE(err)) { |
-        /* reported through log_err so that the test framework counts the failure */ |
-        log_err("test_widestrs: u_strFromWCS error: %s!\n", u_errorName(err)); |
-        return; /* rts may not hold a terminated string */ |
-    } |
-    if(wl != rtl){ |
-        log_err("u_strFromWCS: wcs = %S, wl = %d,rts = %s, rtl = %d!\n", wcs, wl, u_austrcpy(astr, rts), rtl); |
-    } |
-#else |
-    log_info("Not testing u_str*WCS because (!UCONFIG_NO_CONVERSION && !UCONFIG_NO_LEGACY_CONVERSION) and wchar is neither utf16 nor utf32"); |
-#endif |
-} |
- |
-/* |
- * Round-trips a long string through u_strToWCS() and u_strFromWCS(). |
- * The string is the "testinclude" resource of the "testtypes" test bundle; |
- * both directions are preflighted to size their buffers, and the result is |
- * compared with the original UChars. |
- * If the resource cannot be loaded, a data error is logged and the test ends. |
- */ |
-static void |
-Test_WCHART_LongString(void){ |
-#if (defined(U_WCHAR_IS_UTF16) || defined(U_WCHAR_IS_UTF32)) || (!UCONFIG_NO_CONVERSION && !UCONFIG_NO_LEGACY_CONVERSION) |
-    UErrorCode status = U_ZERO_ERROR; |
-    const char* testdatapath=loadTestData(&status); |
-    UResourceBundle *theBundle = ures_open(testdatapath, "testtypes", &status); |
-    int32_t strLen =0; |
-    const UChar* str = ures_getStringByKey(theBundle, "testinclude",&strLen,&status); |
-    const UChar* uSrc = str; |
-    int32_t uSrcLen = strLen; |
-    int32_t wDestLen =0, reqLen=0, i=0; |
-    int32_t uDestLen =0; |
-    int32_t compareLen; |
-    wchar_t* wDest = NULL; |
-    UChar* uDest = NULL; |
-    UBool failed = FALSE; |
- |
-    log_verbose("Loaded string of %d UChars\n", uSrcLen); |
- |
-    if(U_FAILURE(status)){ |
-        log_data_err("Could not get testinclude resource from testtypes bundle. Error: %s\n",u_errorName(status)); |
-        /* the bundle may have been opened even though the string lookup failed */ |
-        ures_close(theBundle); |
-        return; |
-    } |
- |
-    /* pre-flight*/ |
-    u_strToWCS(wDest,wDestLen,&reqLen,uSrc,-1,&status); |
- |
-    if(status == U_BUFFER_OVERFLOW_ERROR){ |
-        status=U_ZERO_ERROR; |
-        wDest =(wchar_t*) malloc(sizeof(wchar_t) * (reqLen+1)); |
-        if(wDest == NULL){ |
-            log_err("Test_WCHART_LongString: malloc failed for %d wchar_ts\n", (int)(reqLen+1)); |
-            ures_close(theBundle); |
-            return; |
-        } |
-        wDestLen = reqLen+1; |
-        u_strToWCS(wDest,wDestLen,&reqLen,uSrc,-1,&status); |
-        /* sizeof yields a size_t; cast it so that it matches %d */ |
-        log_verbose("To %d*%d-byte wchar_ts\n", reqLen,(int)sizeof(wchar_t)); |
-    } |
- |
-    /* informational only: report the first position where the wchar_t and UChar units differ */ |
-    if(wDest != NULL) { |
-        int j; |
-        for(j=0;j<reqLen;j++) { |
-            if(wDest[j]!=uSrc[j]) { |
-                log_verbose("Diff %04X vs %04X @ %d\n", wDest[j],uSrc[j],j); |
-                break; |
-            } |
-        } |
-    } |
- |
-    uDestLen = 0; |
-    /* pre-flight */ |
-    u_strFromWCS(uDest, uDestLen,&reqLen,wDest,-1,&status); |
-    if(status == U_BUFFER_OVERFLOW_ERROR){ |
-        status =U_ZERO_ERROR; |
-        uDest = (UChar*) malloc(sizeof(UChar) * (reqLen+1)); |
-        if(uDest == NULL){ |
-            log_err("Test_WCHART_LongString: malloc failed for %d UChars\n", (int)(reqLen+1)); |
-            free(wDest); |
-            ures_close(theBundle); |
-            return; |
-        } |
-        /* fill with 0xFFFF so that unwritten units cannot match the source by accident */ |
-        u_memset(uDest,0xFFFF,reqLen+1); |
-        uDestLen = reqLen + 1; |
-        u_strFromWCS(uDest, uDestLen,&reqLen,wDest,-1,&status); |
-        log_verbose("Back to %d UChars\n", reqLen); |
-    } |
-#if defined(U_WCHAR_IS_UTF16) |
-    log_verbose("U_WCHAR_IS_UTF16\n"); |
-#elif defined(U_WCHAR_IS_UTF32) |
-    log_verbose("U_WCHAR_IS_UTF32\n"); |
-#else |
-    log_verbose("U_WCHAR_IS_idunno (not UTF)\n"); |
-#endif |
- |
-    if(reqLen!=uSrcLen) { |
-        log_err("Error: dest len is %d but expected src len %d\n", reqLen, uSrcLen); |
-    } |
- |
-    /* compare only what uDest really holds; a length mismatch was reported above */ |
-    if(uDest != NULL && U_SUCCESS(status)) { |
-        compareLen = (reqLen < uSrcLen) ? reqLen : uSrcLen; |
-        for(i=0; i< compareLen; i++){ |
-            if(uDest[i] != str[i]){ |
-                log_verbose("u_str*WCS() failed for null terminated string expected: \\u%04X got: \\u%04X at index: %i \n", str[i], uDest[i],i); |
-                failed =TRUE; |
-            } |
-        } |
-    } |
- |
-    if(U_FAILURE(status)){ |
-        failed = TRUE; |
-    } |
-    if(failed){ |
-        log_err("u_strToWCS() failed \n"); |
-    } |
-    free(wDest); |
-    free(uDest); |
-    /* close the bundle */ |
-    ures_close(theBundle); |
-#else |
-    log_info("Not testing u_str*WCS because (!UCONFIG_NO_CONVERSION && !UCONFIG_NO_LEGACY_CONVERSION) and wchar is neither utf16 nor utf32"); |
-#endif |
-} |
- |
-/* |
- * Tests u_strToJavaModifiedUTF8(): normal conversion with and without a length |
- * output, exact ("tight") capacity, NUL-terminated input, buffer overflow, pure |
- * preflighting, short and ASCII-only inputs, empty input, and illegal arguments. |
- * |
- * Before most calls dest is filled with 0xff bytes and length is set to -5, so |
- * that the checks can tell which bytes and outputs the call really wrote. |
- */ |
-static void Test_strToJavaModifiedUTF8() { |
- /* includes unpaired and paired surrogates and an embedded U+0000 */ |
- static const UChar src[]={ |
- 0x61, 0x62, 0x63, 0xe1, 0xe2, 0xe3, |
- 0xe01, 0xe02, 0xe03, 0xe001, 0xe002, 0xe003, |
- 0xd800, 0xdc00, 0xdc00, 0xd800, 0, |
- 0xdbff, 0xdfff, |
- 0x64, 0x65, 0x66, 0x67, 0x68, 0x69, 0x6a, 0x6b, 0x6c, 0xed, 0xe0e, 0x6f |
- }; |
- /* each surrogate code unit is expected as its own 3-byte sequence, U+0000 as 0xc0 0x80 */ |
- static const uint8_t expected[]={ |
- 0x61, 0x62, 0x63, 0xc3, 0xa1, 0xc3, 0xa2, 0xc3, 0xa3, |
- 0xe0, 0xb8, 0x81, 0xe0, 0xb8, 0x82, 0xe0, 0xb8, 0x83, |
- 0xee, 0x80, 0x81, 0xee, 0x80, 0x82, 0xee, 0x80, 0x83, |
- 0xed, 0xa0, 0x80, 0xed, 0xb0, 0x80, 0xed, 0xb0, 0x80, 0xed, 0xa0, 0x80, 0xc0, 0x80, |
- 0xed, 0xaf, 0xbf, 0xed, 0xbf, 0xbf, |
- 0x64, 0x65, 0x66, 0x67, 0x68, 0x69, 0x6a, 0x6b, 0x6c, 0xc3, 0xad, 0xe0, 0xb8, 0x8e, 0x6f |
- }; |
- static const UChar shortSrc[]={ |
- 0xe01, 0xe1, 0x61 |
- }; |
- static const uint8_t shortExpected[]={ |
- 0xe0, 0xb8, 0x81, 0xc3, 0xa1, 0x61 |
- }; |
- static const UChar asciiNul[]={ |
- 0x61, 0x62, 0x63, 0 |
- }; |
- static const uint8_t asciiNulExpected[]={ |
- 0x61, 0x62, 0x63 |
- }; |
- char dest[200]; |
- char *p; |
- int32_t length, expectedTerminatedLength; |
- UErrorCode errorCode; |
- |
- /* |
- * Number of expected bytes for src read as a NUL-terminated string: everything |
- * before the 0xc0 0x80 pair. NOTE(review): expected[] has no NUL terminator of |
- * its own; strstr() stays in bounds only because the pair occurs inside the array. |
- */ |
- expectedTerminatedLength=(int32_t)(strstr((const char *)expected, "\xc0\x80")- |
- (const char *)expected); |
- |
- /* normal: explicit source length, ample capacity */ |
- errorCode=U_ZERO_ERROR; |
- length=-5; |
- p=u_strToJavaModifiedUTF8(dest, (int32_t)sizeof(dest), &length, |
- src, UPRV_LENGTHOF(src), &errorCode); |
- if( U_FAILURE(errorCode) || p!=dest || |
- length!=UPRV_LENGTHOF(expected) || 0!=memcmp(dest, expected, length) || |
- dest[length]!=0 |
- ) { |
- log_err("u_strToJavaModifiedUTF8(normal) failed - %s\n", u_errorName(errorCode)); |
- } |
- /* same conversion without a length output pointer */ |
- memset(dest, 0xff, sizeof(dest)); |
- errorCode=U_ZERO_ERROR; |
- length=-5; |
- p=u_strToJavaModifiedUTF8(dest, (int32_t)sizeof(dest), NULL, |
- src, UPRV_LENGTHOF(src), &errorCode); |
- if( U_FAILURE(errorCode) || p!=dest || |
- 0!=memcmp(dest, expected, UPRV_LENGTHOF(expected)) || |
- dest[UPRV_LENGTHOF(expected)]!=0 |
- ) { |
- log_err("u_strToJavaModifiedUTF8(normal, pLength=NULL) failed - %s\n", u_errorName(errorCode)); |
- } |
- /* tight: capacity equals the output length, so no terminator is expected */ |
- memset(dest, 0xff, sizeof(dest)); |
- errorCode=U_ZERO_ERROR; |
- length=-5; |
- p=u_strToJavaModifiedUTF8(dest, UPRV_LENGTHOF(expected), &length, |
- src, UPRV_LENGTHOF(src), &errorCode); |
- if( errorCode!=U_STRING_NOT_TERMINATED_WARNING || p!=dest || |
- length!=UPRV_LENGTHOF(expected) || 0!=memcmp(dest, expected, length) || |
- dest[length]!=(char)0xff |
- ) { |
- log_err("u_strToJavaModifiedUTF8(tight) failed - %s\n", u_errorName(errorCode)); |
- } |
- /* NUL-terminated source: conversion stops at the embedded U+0000 */ |
- memset(dest, 0xff, sizeof(dest)); |
- errorCode=U_ZERO_ERROR; |
- length=-5; |
- p=u_strToJavaModifiedUTF8(dest, (int32_t)sizeof(dest), &length, src, -1, &errorCode); |
- if( U_FAILURE(errorCode) || p!=dest || |
- length!=expectedTerminatedLength || 0!=memcmp(dest, expected, length) || |
- dest[length]!=0 |
- ) { |
- log_err("u_strToJavaModifiedUTF8(NUL-terminated) failed - %s\n", u_errorName(errorCode)); |
- } |
- /* NUL-terminated source without a length output pointer */ |
- memset(dest, 0xff, sizeof(dest)); |
- errorCode=U_ZERO_ERROR; |
- length=-5; |
- p=u_strToJavaModifiedUTF8(dest, (int32_t)sizeof(dest), NULL, src, -1, &errorCode); |
- if( U_FAILURE(errorCode) || p!=dest || |
- 0!=memcmp(dest, expected, expectedTerminatedLength) || |
- dest[expectedTerminatedLength]!=0 |
- ) { |
- log_err("u_strToJavaModifiedUTF8(NUL-terminated, pLength=NULL) failed - %s\n", u_errorName(errorCode)); |
- } |
- /* overflow: half the needed capacity; the full length is reported and nothing is written past the capacity */ |
- memset(dest, 0xff, sizeof(dest)); |
- errorCode=U_ZERO_ERROR; |
- length=-5; |
- p=u_strToJavaModifiedUTF8(dest, UPRV_LENGTHOF(expected)/2, &length, |
- src, UPRV_LENGTHOF(src), &errorCode); |
- if( errorCode!=U_BUFFER_OVERFLOW_ERROR || |
- length!=UPRV_LENGTHOF(expected) || dest[UPRV_LENGTHOF(expected)/2]!=(char)0xff |
- ) { |
- log_err("u_strToJavaModifiedUTF8(overflow) failed - %s\n", u_errorName(errorCode)); |
- } |
- /* pure preflighting: NULL destination with capacity 0 */ |
- memset(dest, 0xff, sizeof(dest)); |
- errorCode=U_ZERO_ERROR; |
- length=-5; |
- p=u_strToJavaModifiedUTF8(NULL, 0, &length, |
- src, UPRV_LENGTHOF(src), &errorCode); |
- if( errorCode!=U_BUFFER_OVERFLOW_ERROR || |
- length!=UPRV_LENGTHOF(expected) || dest[0]!=(char)0xff |
- ) { |
- log_err("u_strToJavaModifiedUTF8(pure preflighting) failed - %s\n", u_errorName(errorCode)); |
- } |
- /* short input: one 3-byte, one 2-byte and one 1-byte character */ |
- memset(dest, 0xff, sizeof(dest)); |
- errorCode=U_ZERO_ERROR; |
- length=-5; |
- p=u_strToJavaModifiedUTF8(dest, (int32_t)sizeof(dest), &length, |
- shortSrc, UPRV_LENGTHOF(shortSrc), &errorCode); |
- if( U_FAILURE(errorCode) || p!=dest || |
- length!=UPRV_LENGTHOF(shortExpected) || 0!=memcmp(dest, shortExpected, length) || |
- dest[length]!=0 |
- ) { |
- log_err("u_strToJavaModifiedUTF8(short) failed - %s\n", u_errorName(errorCode)); |
- } |
- /* ASCII-only NUL-terminated input */ |
- memset(dest, 0xff, sizeof(dest)); |
- errorCode=U_ZERO_ERROR; |
- length=-5; |
- p=u_strToJavaModifiedUTF8(dest, (int32_t)sizeof(dest), &length, |
- asciiNul, -1, &errorCode); |
- if( U_FAILURE(errorCode) || p!=dest || |
- length!=UPRV_LENGTHOF(asciiNulExpected) || 0!=memcmp(dest, asciiNulExpected, length) || |
- dest[length]!=0 |
- ) { |
- log_err("u_strToJavaModifiedUTF8(asciiNul) failed - %s\n", u_errorName(errorCode)); |
- } |
- /* empty input: a NULL source is accepted when the length is 0 */ |
- memset(dest, 0xff, sizeof(dest)); |
- errorCode=U_ZERO_ERROR; |
- length=-5; |
- p=u_strToJavaModifiedUTF8(dest, (int32_t)sizeof(dest), &length, |
- NULL, 0, &errorCode); |
- if( U_FAILURE(errorCode) || p!=dest || |
- length!=0 || dest[0]!=0 |
- ) { |
- log_err("u_strToJavaModifiedUTF8(empty) failed - %s\n", u_errorName(errorCode)); |
- } |
- |
- /* illegal arguments */ |
- /* each case expects U_ILLEGAL_ARGUMENT_ERROR and an untouched dest[0] */ |
- memset(dest, 0xff, sizeof(dest)); |
- errorCode=U_ZERO_ERROR; |
- length=-5; |
- p=u_strToJavaModifiedUTF8(NULL, sizeof(dest), &length, |
- src, UPRV_LENGTHOF(src), &errorCode); |
- if(errorCode!=U_ILLEGAL_ARGUMENT_ERROR || dest[0]!=(char)0xff) { |
- log_err("u_strToJavaModifiedUTF8(dest=NULL) failed - %s\n", u_errorName(errorCode)); |
- } |
- memset(dest, 0xff, sizeof(dest)); |
- errorCode=U_ZERO_ERROR; |
- length=-5; |
- p=u_strToJavaModifiedUTF8(dest, -1, &length, |
- src, UPRV_LENGTHOF(src), &errorCode); |
- if(errorCode!=U_ILLEGAL_ARGUMENT_ERROR || dest[0]!=(char)0xff) { |
- log_err("u_strToJavaModifiedUTF8(destCapacity<0) failed - %s\n", u_errorName(errorCode)); |
- } |
- memset(dest, 0xff, sizeof(dest)); |
- errorCode=U_ZERO_ERROR; |
- length=-5; |
- p=u_strToJavaModifiedUTF8(dest, sizeof(dest), &length, |
- NULL, UPRV_LENGTHOF(src), &errorCode); |
- if(errorCode!=U_ILLEGAL_ARGUMENT_ERROR || dest[0]!=(char)0xff) { |
- log_err("u_strToJavaModifiedUTF8(src=NULL) failed - %s\n", u_errorName(errorCode)); |
- } |
- memset(dest, 0xff, sizeof(dest)); |
- errorCode=U_ZERO_ERROR; |
- length=-5; |
- p=u_strToJavaModifiedUTF8(dest, sizeof(dest), &length, |
- NULL, -1, &errorCode); |
- if(errorCode!=U_ILLEGAL_ARGUMENT_ERROR || dest[0]!=(char)0xff) { |
- log_err("u_strToJavaModifiedUTF8(src=NULL, srcLength<0) failed - %s\n", u_errorName(errorCode)); |
- } |
-} |
- |
-/* |
- * Tests u_strFromJavaModifiedUTF8WithSub() with well-formed input, an embedded |
- * NUL, ill-formed sequences (with and without a substitution character), |
- * overflow/preflighting, and illegal arguments. |
- * |
- * Before most calls dest is filled with 0xff bytes, so the checks below treat |
- * a UChar that still reads 0xffff as "not written by the function". |
- * Destination capacities are passed in UChars (UPRV_LENGTHOF), and results are |
- * compared with u_memcmp(), which counts UChars; memcmp() with a UChar count |
- * would compare only the first half of the output. |
- */ |
-static void Test_strFromJavaModifiedUTF8() { |
-    static const uint8_t src[]={ |
-        0x61, 0x62, 0x63, 0xc3, 0xa1, 0xc3, 0xa2, 0xc3, 0xa3, |
-        0xe0, 0xb8, 0x81, 0xe0, 0xb8, 0x82, 0xe0, 0xb8, 0x83, |
-        0xee, 0x80, 0x81, 0xee, 0x80, 0x82, 0xee, 0x80, 0x83, |
-        0xed, 0xa0, 0x80, 0xed, 0xb0, 0x80, 0xed, 0xb0, 0x80, 0xed, 0xa0, 0x80, 0, |
-        0xed, 0xaf, 0xbf, 0xed, 0xbf, 0xbf, |
-        0x81, 0xc0, 0xe0, 0xb8, 0xf0, 0x90, 0x80, 0x80, /* invalid sequences */ |
-        0x64, 0x65, 0x66, 0x67, 0x68, 0x69, 0x6a, 0x6b, |
-        0xe0, 0x81, 0xac, 0xe0, 0x83, 0xad, /* non-shortest forms are allowed */ |
-        0xe0, 0xb8, 0x8e, 0x6f |
-    }; |
-    static const UChar expected[]={ |
-        0x61, 0x62, 0x63, 0xe1, 0xe2, 0xe3, |
-        0xe01, 0xe02, 0xe03, 0xe001, 0xe002, 0xe003, |
-        0xd800, 0xdc00, 0xdc00, 0xd800, 0, |
-        0xdbff, 0xdfff, |
-        0xfffd, 0xfffd, 0xfffd, 0xfffd, |
-        0x64, 0x65, 0x66, 0x67, 0x68, 0x69, 0x6a, 0x6b, |
-        0x6c, 0xed, |
-        0xe0e, 0x6f |
-    }; |
-    static const uint8_t shortSrc[]={ |
-        0xe0, 0xb8, 0x81, 0xc3, 0xa1, 0x61 |
-    }; |
-    static const UChar shortExpected[]={ |
-        0xe01, 0xe1, 0x61 |
-    }; |
-    static const uint8_t asciiNul[]={ |
-        0x61, 0x62, 0x63, 0 |
-    }; |
-    static const UChar asciiNulExpected[]={ |
-        0x61, 0x62, 0x63 |
-    }; |
-    static const uint8_t invalid[]={ |
-        0x81, 0xc0, 0xe0, 0xb8, 0xf0, 0x90, 0x80, 0x80 |
-    }; |
-    static const UChar invalidExpectedFFFD[]={ |
-        0xfffd, 0xfffd, 0xfffd, 0xfffd |
-    }; |
-    /* U+50000 as a surrogate pair, once per invalid sequence */ |
-    static const UChar invalidExpected50000[]={ |
-        0xd900, 0xdc00, 0xd900, 0xdc00, 0xd900, 0xdc00, 0xd900, 0xdc00 |
-    }; |
-    UChar dest[200]; |
-    UChar *p; |
-    int32_t length, expectedTerminatedLength; |
-    int32_t numSubstitutions; |
-    UErrorCode errorCode; |
- |
-    /* number of expected UChars before the embedded NUL */ |
-    expectedTerminatedLength=(int32_t)(u_strchr(expected, 0)-expected); |
- |
-    /* explicit source length, all output parameters supplied */ |
-    errorCode=U_ZERO_ERROR; |
-    length=numSubstitutions=-5; |
-    p=u_strFromJavaModifiedUTF8WithSub(dest, UPRV_LENGTHOF(dest), &length, |
-                                       (const char *)src, UPRV_LENGTHOF(src), |
-                                       0xfffd, &numSubstitutions, &errorCode); |
-    if( U_FAILURE(errorCode) || p!=dest || |
-        length!=UPRV_LENGTHOF(expected) || 0!=u_memcmp(dest, expected, length) || |
-        dest[length]!=0 || |
-        numSubstitutions!=UPRV_LENGTHOF(invalidExpectedFFFD) |
-    ) { |
-        log_err("u_strFromJavaModifiedUTF8WithSub(normal) failed - %s\n", u_errorName(errorCode)); |
-    } |
-    /* same input, pDestLength=NULL */ |
-    memset(dest, 0xff, sizeof(dest)); |
-    errorCode=U_ZERO_ERROR; |
-    length=numSubstitutions=-5; |
-    p=u_strFromJavaModifiedUTF8WithSub(dest, UPRV_LENGTHOF(dest), NULL, |
-                                       (const char *)src, UPRV_LENGTHOF(src), |
-                                       0xfffd, &numSubstitutions, &errorCode); |
-    if( U_FAILURE(errorCode) || p!=dest || |
-        0!=u_memcmp(dest, expected, UPRV_LENGTHOF(expected)) || |
-        dest[UPRV_LENGTHOF(expected)]!=0 || |
-        numSubstitutions!=UPRV_LENGTHOF(invalidExpectedFFFD) |
-    ) { |
-        log_err("u_strFromJavaModifiedUTF8WithSub(normal, pLength=NULL) failed - %s\n", u_errorName(errorCode)); |
-    } |
-    /* same input, pNumSubstitutions=NULL */ |
-    memset(dest, 0xff, sizeof(dest)); |
-    errorCode=U_ZERO_ERROR; |
-    length=numSubstitutions=-5; |
-    p=u_strFromJavaModifiedUTF8WithSub(dest, UPRV_LENGTHOF(dest), &length, |
-                                       (const char *)src, UPRV_LENGTHOF(src), |
-                                       0xfffd, NULL, &errorCode); |
-    if( U_FAILURE(errorCode) || p!=dest || |
-        length!=UPRV_LENGTHOF(expected) || 0!=u_memcmp(dest, expected, length) || |
-        dest[length]!=0 |
-    ) { |
-        log_err("u_strFromJavaModifiedUTF8WithSub(normal, pNumSubstitutions=NULL) failed - %s\n", u_errorName(errorCode)); |
-    } |
-    /* capacity equals the output length: expect a warning and no terminator written */ |
-    memset(dest, 0xff, sizeof(dest)); |
-    errorCode=U_ZERO_ERROR; |
-    length=numSubstitutions=-5; |
-    p=u_strFromJavaModifiedUTF8WithSub(dest, UPRV_LENGTHOF(expected), &length, |
-                                       (const char *)src, UPRV_LENGTHOF(src), |
-                                       0xfffd, &numSubstitutions, &errorCode); |
-    if( errorCode!=U_STRING_NOT_TERMINATED_WARNING || p!=dest || |
-        length!=UPRV_LENGTHOF(expected) || 0!=u_memcmp(dest, expected, length) || |
-        dest[length]!=0xffff || |
-        numSubstitutions!=UPRV_LENGTHOF(invalidExpectedFFFD) |
-    ) { |
-        log_err("u_strFromJavaModifiedUTF8WithSub(tight) failed - %s\n", u_errorName(errorCode)); |
-    } |
-    /* srcLength=-1: expect output only up to the embedded NUL, with no substitutions */ |
-    memset(dest, 0xff, sizeof(dest)); |
-    errorCode=U_ZERO_ERROR; |
-    length=numSubstitutions=-5; |
-    p=u_strFromJavaModifiedUTF8WithSub(dest, UPRV_LENGTHOF(dest), &length, |
-                                       (const char *)src, -1, |
-                                       0xfffd, &numSubstitutions, &errorCode); |
-    if( U_FAILURE(errorCode) || p!=dest || |
-        length!=expectedTerminatedLength || 0!=u_memcmp(dest, expected, length) || |
-        dest[length]!=0 || |
-        numSubstitutions!=0 |
-    ) { |
-        log_err("u_strFromJavaModifiedUTF8WithSub(NUL-terminated) failed - %s\n", u_errorName(errorCode)); |
-    } |
-    /* NUL-terminated source, pDestLength=NULL */ |
-    memset(dest, 0xff, sizeof(dest)); |
-    errorCode=U_ZERO_ERROR; |
-    length=numSubstitutions=-5; |
-    p=u_strFromJavaModifiedUTF8WithSub(dest, UPRV_LENGTHOF(dest), NULL, |
-                                       (const char *)src, -1, |
-                                       0xfffd, &numSubstitutions, &errorCode); |
-    if( U_FAILURE(errorCode) || p!=dest || |
-        0!=u_memcmp(dest, expected, expectedTerminatedLength) || |
-        dest[expectedTerminatedLength]!=0 || |
-        numSubstitutions!=0 |
-    ) { |
-        log_err("u_strFromJavaModifiedUTF8WithSub(NUL-terminated, pLength=NULL) failed - %s\n", u_errorName(errorCode)); |
-    } |
-    /* NUL-terminated source, pNumSubstitutions=NULL */ |
-    memset(dest, 0xff, sizeof(dest)); |
-    errorCode=U_ZERO_ERROR; |
-    length=numSubstitutions=-5; |
-    p=u_strFromJavaModifiedUTF8WithSub(dest, UPRV_LENGTHOF(dest), &length, |
-                                       (const char *)src, -1, |
-                                       0xfffd, NULL, &errorCode); |
-    if( U_FAILURE(errorCode) || p!=dest || |
-        length!=expectedTerminatedLength || 0!=u_memcmp(dest, expected, length) || |
-        dest[length]!=0 |
-    ) { |
-        log_err("u_strFromJavaModifiedUTF8WithSub(NUL-terminated, pNumSubstitutions=NULL) failed - %s\n", u_errorName(errorCode)); |
-    } |
-    /* capacity too small: expect overflow, the full length reported, nothing written past capacity */ |
-    memset(dest, 0xff, sizeof(dest)); |
-    errorCode=U_ZERO_ERROR; |
-    length=numSubstitutions=-5; |
-    p=u_strFromJavaModifiedUTF8WithSub(dest, UPRV_LENGTHOF(expected)/2, &length, |
-                                       (const char *)src, UPRV_LENGTHOF(src), |
-                                       0xfffd, &numSubstitutions, &errorCode); |
-    if( errorCode!=U_BUFFER_OVERFLOW_ERROR || |
-        length!=UPRV_LENGTHOF(expected) || dest[UPRV_LENGTHOF(expected)/2]!=0xffff |
-    ) { |
-        log_err("u_strFromJavaModifiedUTF8WithSub(overflow) failed - %s\n", u_errorName(errorCode)); |
-    } |
-    /* preflighting with dest=NULL and capacity 0 */ |
-    memset(dest, 0xff, sizeof(dest)); |
-    errorCode=U_ZERO_ERROR; |
-    length=numSubstitutions=-5; |
-    p=u_strFromJavaModifiedUTF8WithSub(NULL, 0, &length, |
-                                       (const char *)src, UPRV_LENGTHOF(src), |
-                                       0xfffd, &numSubstitutions, &errorCode); |
-    if( errorCode!=U_BUFFER_OVERFLOW_ERROR || |
-        length!=UPRV_LENGTHOF(expected) || dest[0]!=0xffff |
-    ) { |
-        log_err("u_strFromJavaModifiedUTF8WithSub(pure preflighting) failed - %s\n", u_errorName(errorCode)); |
-    } |
-    /* short, fully valid input */ |
-    memset(dest, 0xff, sizeof(dest)); |
-    errorCode=U_ZERO_ERROR; |
-    length=numSubstitutions=-5; |
-    p=u_strFromJavaModifiedUTF8WithSub(dest, UPRV_LENGTHOF(dest), &length, |
-                                       (const char *)shortSrc, UPRV_LENGTHOF(shortSrc), |
-                                       0xfffd, &numSubstitutions, &errorCode); |
-    if( U_FAILURE(errorCode) || p!=dest || |
-        length!=UPRV_LENGTHOF(shortExpected) || 0!=u_memcmp(dest, shortExpected, length) || |
-        dest[length]!=0 || |
-        numSubstitutions!=0 |
-    ) { |
-        log_err("u_strFromJavaModifiedUTF8WithSub(short) failed - %s\n", u_errorName(errorCode)); |
-    } |
-    /* NUL-terminated ASCII-only input */ |
-    memset(dest, 0xff, sizeof(dest)); |
-    errorCode=U_ZERO_ERROR; |
-    length=numSubstitutions=-5; |
-    p=u_strFromJavaModifiedUTF8WithSub(dest, UPRV_LENGTHOF(dest), &length, |
-                                       (const char *)asciiNul, -1, |
-                                       0xfffd, &numSubstitutions, &errorCode); |
-    if( U_FAILURE(errorCode) || p!=dest || |
-        length!=UPRV_LENGTHOF(asciiNulExpected) || 0!=u_memcmp(dest, asciiNulExpected, length) || |
-        dest[length]!=0 || |
-        numSubstitutions!=0 |
-    ) { |
-        log_err("u_strFromJavaModifiedUTF8WithSub(asciiNul) failed - %s\n", u_errorName(errorCode)); |
-    } |
-    /* empty input: src=NULL is accepted when srcLength==0 */ |
-    memset(dest, 0xff, sizeof(dest)); |
-    errorCode=U_ZERO_ERROR; |
-    length=numSubstitutions=-5; |
-    p=u_strFromJavaModifiedUTF8WithSub(dest, UPRV_LENGTHOF(dest), &length, |
-                                       NULL, 0, 0xfffd, &numSubstitutions, &errorCode); |
-    if( U_FAILURE(errorCode) || p!=dest || |
-        length!=0 || dest[0]!=0 || |
-        numSubstitutions!=0 |
-    ) { |
-        log_err("u_strFromJavaModifiedUTF8WithSub(empty) failed - %s\n", u_errorName(errorCode)); |
-    } |
-    /* only invalid sequences, each replaced by U+FFFD */ |
-    memset(dest, 0xff, sizeof(dest)); |
-    errorCode=U_ZERO_ERROR; |
-    length=numSubstitutions=-5; |
-    p=u_strFromJavaModifiedUTF8WithSub(dest, UPRV_LENGTHOF(dest), &length, |
-                                       (const char *)invalid, UPRV_LENGTHOF(invalid), |
-                                       0xfffd, &numSubstitutions, &errorCode); |
-    if( U_FAILURE(errorCode) || p!=dest || |
-        length!=UPRV_LENGTHOF(invalidExpectedFFFD) || 0!=u_memcmp(dest, invalidExpectedFFFD, length) || |
-        dest[length]!=0 || |
-        numSubstitutions!=UPRV_LENGTHOF(invalidExpectedFFFD) |
-    ) { |
-        log_err("u_strFromJavaModifiedUTF8WithSub(invalid->fffd) failed - %s\n", u_errorName(errorCode)); |
-    } |
-    /* supplementary substitution character: two UChars per substitution, but each counted once */ |
-    memset(dest, 0xff, sizeof(dest)); |
-    errorCode=U_ZERO_ERROR; |
-    length=numSubstitutions=-5; |
-    p=u_strFromJavaModifiedUTF8WithSub(dest, UPRV_LENGTHOF(dest), &length, |
-                                       (const char *)invalid, UPRV_LENGTHOF(invalid), |
-                                       0x50000, &numSubstitutions, &errorCode); |
-    if( U_FAILURE(errorCode) || p!=dest || |
-        length!=UPRV_LENGTHOF(invalidExpected50000) || 0!=u_memcmp(dest, invalidExpected50000, length) || |
-        dest[length]!=0 || |
-        numSubstitutions!=UPRV_LENGTHOF(invalidExpectedFFFD)  /* not ...50000 */ |
-    ) { |
-        log_err("u_strFromJavaModifiedUTF8WithSub(invalid->50000) failed - %s\n", u_errorName(errorCode)); |
-    } |
-    /* subchar=U_SENTINEL: invalid input must be reported as an error, with dest untouched */ |
-    memset(dest, 0xff, sizeof(dest)); |
-    errorCode=U_ZERO_ERROR; |
-    length=numSubstitutions=-5; |
-    p=u_strFromJavaModifiedUTF8WithSub(dest, UPRV_LENGTHOF(dest), &length, |
-                                       (const char *)invalid, UPRV_LENGTHOF(invalid), |
-                                       U_SENTINEL, &numSubstitutions, &errorCode); |
-    if(errorCode!=U_INVALID_CHAR_FOUND || dest[0]!=0xffff || numSubstitutions!=0) { |
-        log_err("u_strFromJavaModifiedUTF8WithSub(invalid->error) failed - %s\n", u_errorName(errorCode)); |
-    } |
-    /* subchar=U_SENTINEL on the mixed input: expect an error before the full output is produced */ |
-    memset(dest, 0xff, sizeof(dest)); |
-    errorCode=U_ZERO_ERROR; |
-    length=numSubstitutions=-5; |
-    p=u_strFromJavaModifiedUTF8WithSub(dest, UPRV_LENGTHOF(dest), &length, |
-                                       (const char *)src, UPRV_LENGTHOF(src), |
-                                       U_SENTINEL, &numSubstitutions, &errorCode); |
-    if( errorCode!=U_INVALID_CHAR_FOUND || |
-        length>=UPRV_LENGTHOF(expected) || dest[UPRV_LENGTHOF(expected)-1]!=0xffff || |
-        numSubstitutions!=0 |
-    ) { |
-        log_err("u_strFromJavaModifiedUTF8WithSub(normal->error) failed - %s\n", u_errorName(errorCode)); |
-    } |
- |
-    /* illegal arguments: each call must fail with U_ILLEGAL_ARGUMENT_ERROR and leave dest untouched */ |
-    memset(dest, 0xff, sizeof(dest)); |
-    errorCode=U_ZERO_ERROR; |
-    length=numSubstitutions=-5; |
-    p=u_strFromJavaModifiedUTF8WithSub(NULL, UPRV_LENGTHOF(dest), &length, |
-                                       (const char *)src, UPRV_LENGTHOF(src), |
-                                       0xfffd, &numSubstitutions, &errorCode); |
-    if(errorCode!=U_ILLEGAL_ARGUMENT_ERROR || dest[0]!=0xffff) { |
-        log_err("u_strFromJavaModifiedUTF8WithSub(dest=NULL) failed - %s\n", u_errorName(errorCode)); |
-    } |
-    memset(dest, 0xff, sizeof(dest)); |
-    errorCode=U_ZERO_ERROR; |
-    length=numSubstitutions=-5; |
-    p=u_strFromJavaModifiedUTF8WithSub(dest, -1, &length, |
-                                       (const char *)src, UPRV_LENGTHOF(src), |
-                                       0xfffd, &numSubstitutions, &errorCode); |
-    if(errorCode!=U_ILLEGAL_ARGUMENT_ERROR || dest[0]!=0xffff) { |
-        log_err("u_strFromJavaModifiedUTF8WithSub(destCapacity<0) failed - %s\n", u_errorName(errorCode)); |
-    } |
-    memset(dest, 0xff, sizeof(dest)); |
-    errorCode=U_ZERO_ERROR; |
-    length=numSubstitutions=-5; |
-    p=u_strFromJavaModifiedUTF8WithSub(dest, UPRV_LENGTHOF(dest), &length, |
-                                       NULL, UPRV_LENGTHOF(src), |
-                                       0xfffd, &numSubstitutions, &errorCode); |
-    if(errorCode!=U_ILLEGAL_ARGUMENT_ERROR || dest[0]!=0xffff) { |
-        log_err("u_strFromJavaModifiedUTF8WithSub(src=NULL) failed - %s\n", u_errorName(errorCode)); |
-    } |
-    memset(dest, 0xff, sizeof(dest)); |
-    errorCode=U_ZERO_ERROR; |
-    length=numSubstitutions=-5; |
-    p=u_strFromJavaModifiedUTF8WithSub(dest, UPRV_LENGTHOF(dest), &length, |
-                                       NULL, -1, 0xfffd, &numSubstitutions, &errorCode); |
-    if(errorCode!=U_ILLEGAL_ARGUMENT_ERROR || dest[0]!=0xffff) { |
-        log_err("u_strFromJavaModifiedUTF8WithSub(src=NULL, srcLength<0) failed - %s\n", u_errorName(errorCode)); |
-    } |
-    /* substitution character above U+10FFFF */ |
-    memset(dest, 0xff, sizeof(dest)); |
-    errorCode=U_ZERO_ERROR; |
-    length=numSubstitutions=-5; |
-    p=u_strFromJavaModifiedUTF8WithSub(dest, UPRV_LENGTHOF(dest), &length, |
-                                       (const char *)src, UPRV_LENGTHOF(src), |
-                                       0x110000, &numSubstitutions, &errorCode); |
-    if(errorCode!=U_ILLEGAL_ARGUMENT_ERROR || dest[0]!=0xffff) { |
-        log_err("u_strFromJavaModifiedUTF8WithSub(subchar=0x110000) failed - %s\n", u_errorName(errorCode)); |
-    } |
-    /* substitution character that is a surrogate code point */ |
-    memset(dest, 0xff, sizeof(dest)); |
-    errorCode=U_ZERO_ERROR; |
-    length=numSubstitutions=-5; |
-    p=u_strFromJavaModifiedUTF8WithSub(dest, UPRV_LENGTHOF(dest), &length, |
-                                       (const char *)src, UPRV_LENGTHOF(src), |
-                                       0xdfff, &numSubstitutions, &errorCode); |
-    if(errorCode!=U_ILLEGAL_ARGUMENT_ERROR || dest[0]!=0xffff) { |
-        log_err("u_strFromJavaModifiedUTF8WithSub(subchar is surrogate) failed - %s\n", u_errorName(errorCode)); |
-    } |
-} |
- |
-/* |
- * Test that string transformation functions permit a NULL source pointer |
- * when the source length is 0. |
- * |
- * Every destination buffer is pre-filled with 3. Each call is expected to |
- * succeed with U_ZERO_ERROR, report length 0, write a terminating 0 into |
- * element [0], and leave element [1] at its original value 3. |
- */ |
-static void TestNullEmptySource() { |
-    char dest8[4]={ 3, 3, 3, 3 }; |
-    UChar dest16[4]={ 3, 3, 3, 3 }; |
-    UChar32 dest32[4]={ 3, 3, 3, 3 }; |
-#if (defined(U_WCHAR_IS_UTF16) || defined(U_WCHAR_IS_UTF32)) || (!UCONFIG_NO_CONVERSION && !UCONFIG_NO_LEGACY_CONVERSION) |
-    wchar_t destW[4]={ 3, 3, 3, 3 }; |
-#endif |
- |
-    int32_t length; |
-    UErrorCode errorCode; |
- |
-    /* u_strFromXyz() */ |
- |
-    dest16[0]=3; |
-    length=3; |
-    errorCode=U_ZERO_ERROR; |
-    u_strFromUTF8(dest16, UPRV_LENGTHOF(dest16), &length, NULL, 0, &errorCode); |
-    if(errorCode!=U_ZERO_ERROR || length!=0 || dest16[0]!=0 || dest16[1]!=3) { |
-        log_err("u_strFromUTF8(source=NULL, sourceLength=0) failed\n"); |
-    } |
- |
-    dest16[0]=3; |
-    length=3; |
-    errorCode=U_ZERO_ERROR; |
-    u_strFromUTF8WithSub(dest16, UPRV_LENGTHOF(dest16), &length, NULL, 0, 0xfffd, NULL, &errorCode); |
-    if(errorCode!=U_ZERO_ERROR || length!=0 || dest16[0]!=0 || dest16[1]!=3) { |
-        log_err("u_strFromUTF8WithSub(source=NULL, sourceLength=0) failed\n"); |
-    } |
- |
-    dest16[0]=3; |
-    length=3; |
-    errorCode=U_ZERO_ERROR; |
-    u_strFromUTF8Lenient(dest16, UPRV_LENGTHOF(dest16), &length, NULL, 0, &errorCode); |
-    if(errorCode!=U_ZERO_ERROR || length!=0 || dest16[0]!=0 || dest16[1]!=3) { |
-        log_err("u_strFromUTF8Lenient(source=NULL, sourceLength=0) failed\n"); |
-    } |
- |
-    dest16[0]=3; |
-    length=3; |
-    errorCode=U_ZERO_ERROR; |
-    u_strFromUTF32(dest16, UPRV_LENGTHOF(dest16), &length, NULL, 0, &errorCode); |
-    if(errorCode!=U_ZERO_ERROR || length!=0 || dest16[0]!=0 || dest16[1]!=3) { |
-        log_err("u_strFromUTF32(source=NULL, sourceLength=0) failed\n"); |
-    } |
- |
-    dest16[0]=3; |
-    length=3; |
-    errorCode=U_ZERO_ERROR; |
-    u_strFromUTF32WithSub(dest16, UPRV_LENGTHOF(dest16), &length, NULL, 0, 0xfffd, NULL, &errorCode); |
-    if(errorCode!=U_ZERO_ERROR || length!=0 || dest16[0]!=0 || dest16[1]!=3) { |
-        log_err("u_strFromUTF32WithSub(source=NULL, sourceLength=0) failed\n"); |
-    } |
- |
-    dest16[0]=3; |
-    length=3; |
-    errorCode=U_ZERO_ERROR; |
-    u_strFromJavaModifiedUTF8WithSub(dest16, UPRV_LENGTHOF(dest16), &length, NULL, 0, 0xfffd, NULL, &errorCode); |
-    if(errorCode!=U_ZERO_ERROR || length!=0 || dest16[0]!=0 || dest16[1]!=3) { |
-        log_err("u_strFromJavaModifiedUTF8WithSub(source=NULL, sourceLength=0) failed\n"); |
-    } |
- |
-    /* u_strToXyz() */ |
- |
-    dest8[0]=3; |
-    length=3; |
-    errorCode=U_ZERO_ERROR; |
-    u_strToUTF8(dest8, UPRV_LENGTHOF(dest8), &length, NULL, 0, &errorCode); |
-    if(errorCode!=U_ZERO_ERROR || length!=0 || dest8[0]!=0 || dest8[1]!=3) { |
-        log_err("u_strToUTF8(source=NULL, sourceLength=0) failed\n"); |
-    } |
- |
-    dest8[0]=3; |
-    length=3; |
-    errorCode=U_ZERO_ERROR; |
-    u_strToUTF8WithSub(dest8, UPRV_LENGTHOF(dest8), &length, NULL, 0, 0xfffd, NULL, &errorCode); |
-    if(errorCode!=U_ZERO_ERROR || length!=0 || dest8[0]!=0 || dest8[1]!=3) { |
-        /* name the WithSub variant so this failure is distinguishable from the u_strToUTF8() case */ |
-        log_err("u_strToUTF8WithSub(source=NULL, sourceLength=0) failed\n"); |
-    } |
- |
-    dest32[0]=3; |
-    length=3; |
-    errorCode=U_ZERO_ERROR; |
-    u_strToUTF32(dest32, UPRV_LENGTHOF(dest32), &length, NULL, 0, &errorCode); |
-    if(errorCode!=U_ZERO_ERROR || length!=0 || dest32[0]!=0 || dest32[1]!=3) { |
-        log_err("u_strToUTF32(source=NULL, sourceLength=0) failed\n"); |
-    } |
- |
-    dest32[0]=3; |
-    length=3; |
-    errorCode=U_ZERO_ERROR; |
-    u_strToUTF32WithSub(dest32, UPRV_LENGTHOF(dest32), &length, NULL, 0, 0xfffd, NULL, &errorCode); |
-    if(errorCode!=U_ZERO_ERROR || length!=0 || dest32[0]!=0 || dest32[1]!=3) { |
-        log_err("u_strToUTF32WithSub(source=NULL, sourceLength=0) failed\n"); |
-    } |
- |
-    dest8[0]=3; |
-    length=3; |
-    errorCode=U_ZERO_ERROR; |
-    u_strToJavaModifiedUTF8(dest8, UPRV_LENGTHOF(dest8), &length, NULL, 0, &errorCode); |
-    if(errorCode!=U_ZERO_ERROR || length!=0 || dest8[0]!=0 || dest8[1]!=3) { |
-        log_err("u_strToJavaModifiedUTF8(source=NULL, sourceLength=0) failed\n"); |
-    } |
- |
-    /* the wchar_t conversions are compiled only under the same condition that declares destW */ |
-#if (defined(U_WCHAR_IS_UTF16) || defined(U_WCHAR_IS_UTF32)) || (!UCONFIG_NO_CONVERSION && !UCONFIG_NO_LEGACY_CONVERSION) |
- |
-    dest16[0]=3; |
-    length=3; |
-    errorCode=U_ZERO_ERROR; |
-    u_strFromWCS(dest16, UPRV_LENGTHOF(dest16), &length, NULL, 0, &errorCode); |
-    if(errorCode!=U_ZERO_ERROR || length!=0 || dest16[0]!=0 || dest16[1]!=3) { |
-        log_err("u_strFromWCS(source=NULL, sourceLength=0) failed\n"); |
-    } |
- |
-    destW[0]=3; |
-    length=3; |
-    errorCode=U_ZERO_ERROR; |
-    u_strToWCS(destW, UPRV_LENGTHOF(destW), &length, NULL, 0, &errorCode); |
-    if(errorCode!=U_ZERO_ERROR || length!=0 || destW[0]!=0 || destW[1]!=3) { |
-        log_err("u_strToWCS(source=NULL, sourceLength=0) failed\n"); |
-    } |
- |
-#endif |
-} |