Index: icu46/source/test/cintltst/ncnvfbts.c |
=================================================================== |
--- icu46/source/test/cintltst/ncnvfbts.c (revision 0) |
+++ icu46/source/test/cintltst/ncnvfbts.c (revision 0) |
@@ -0,0 +1,757 @@ |
+/******************************************************************** |
+ * COPYRIGHT: |
+ * Copyright (c) 1997-2010, International Business Machines Corporation and |
+ * others. All Rights Reserved. |
+ ***************************************************************************/ |
+/***************************************************************************** |
+* |
+* File NCNVCBTS |
+* |
+* Modification History: |
+* Name Date Description |
+* Madhu Katragadda 06/23/2000 Tests for Conveter FallBack API and Functionality |
+****************************************************************************** |
+*/ |
+#include <stdio.h> |
+#include "unicode/uloc.h" |
+#include "unicode/ucnv.h" |
+#include "unicode/ucnv_err.h" |
+#include "cintltst.h" |
+#include "unicode/utypes.h" |
+#include "unicode/ustring.h" |
+#include "ncnvfbts.h" |
+#include "cmemory.h" |
+#include "cstring.h" |
+ |
+#if !UCONFIG_NO_LEGACY_CONVERSION |
+#define NEW_MAX_BUFFER 999 |
+ |
+ |
+#define nct_min(x,y) ((x<y) ? x : y) |
+ |
+static int32_t gInBufferSize = 0; |
+static int32_t gOutBufferSize = 0; |
+static char gNuConvTestName[1024]; |
+ |
+static UConverter *my_ucnv_open(const char *cnv, UErrorCode *err) |
+{ |
+ if(cnv && cnv[0] == '@') { |
+ return ucnv_openPackage("testdata", cnv+1, err); |
+ } else { |
+ return ucnv_open(cnv, err); |
+ } |
+} |
+ |
+ |
+static void printSeq(const unsigned char* a, int len) |
+{ |
+ int i=0; |
+ log_verbose("{"); |
+ while (i<len) |
+ log_verbose("0x%02x ", a[i++]); |
+ log_verbose("}\n"); |
+} |
+ |
+static void printUSeq(const UChar* a, int len) |
+{ |
+ int i=0; |
+ log_verbose("{U+"); |
+ while (i<len) |
+ log_verbose("0x%04x ", a[i++]); |
+ log_verbose("}\n"); |
+} |
+ |
+static void printSeqErr(const unsigned char* a, int len) |
+{ |
+ int i=0; |
+ fprintf(stderr, "{"); |
+ while (i<len) |
+ fprintf(stderr, "0x%02x ", a[i++]); |
+ fprintf(stderr, "}\n"); |
+} |
+ |
+static void printUSeqErr(const UChar* a, int len) |
+{ |
+ int i=0; |
+ fprintf(stderr, "{U+"); |
+ while (i<len) |
+ fprintf(stderr, "0x%04x ", a[i++]); |
+ fprintf(stderr,"}\n"); |
+} |
+ |
+static void TestConverterFallBack(void) |
+{ |
+ TestConvertFallBackWithBufferSizes(10,10); |
+ TestConvertFallBackWithBufferSizes(2,3); |
+ TestConvertFallBackWithBufferSizes(3,2); |
+ TestConvertFallBackWithBufferSizes(NEW_MAX_BUFFER,1); |
+ TestConvertFallBackWithBufferSizes(NEW_MAX_BUFFER,2); |
+ TestConvertFallBackWithBufferSizes(NEW_MAX_BUFFER,3); |
+ TestConvertFallBackWithBufferSizes(NEW_MAX_BUFFER,4); |
+ TestConvertFallBackWithBufferSizes(NEW_MAX_BUFFER,5); |
+ TestConvertFallBackWithBufferSizes(NEW_MAX_BUFFER,6); |
+ TestConvertFallBackWithBufferSizes(1,NEW_MAX_BUFFER); |
+ TestConvertFallBackWithBufferSizes(2,NEW_MAX_BUFFER); |
+ TestConvertFallBackWithBufferSizes(3,NEW_MAX_BUFFER); |
+ TestConvertFallBackWithBufferSizes(4,NEW_MAX_BUFFER); |
+ TestConvertFallBackWithBufferSizes(5,NEW_MAX_BUFFER); |
+ TestConvertFallBackWithBufferSizes(NEW_MAX_BUFFER,NEW_MAX_BUFFER); |
+ |
+} |
+ |
+ |
+void addTestConverterFallBack(TestNode** root); |
+ |
+void addTestConverterFallBack(TestNode** root) |
+{ |
+#if !UCONFIG_NO_FILE_IO |
+ addTest(root, &TestConverterFallBack, "tsconv/ncnvfbts/TestConverterFallBack"); |
+#endif |
+ |
+} |
+ |
+ |
+/* Note that this test already makes use of statics, so it's not really |
+ multithread safe. |
+ This convenience function lets us make the error messages actually useful. |
+*/ |
+ |
+static void setNuConvTestName(const char *codepage, const char *direction) |
+{ |
+ sprintf(gNuConvTestName, "[Testing %s %s Unicode, InputBufSiz=%d, OutputBufSiz=%d]", |
+ codepage, |
+ direction, |
+ (int)gInBufferSize, |
+ (int)gOutBufferSize); |
+} |
+ |
+ |
+static UBool testConvertFromUnicode(const UChar *source, int sourceLen, const uint8_t *expect, int expectLen, |
+ const char *codepage, UBool fallback, const int32_t *expectOffsets) |
+{ |
+ |
+ |
+ UErrorCode status = U_ZERO_ERROR; |
+ UConverter *conv = 0; |
+ char junkout[NEW_MAX_BUFFER]; /* FIX */ |
+ int32_t junokout[NEW_MAX_BUFFER]; /* FIX */ |
+ const UChar *src; |
+ char *end; |
+ char *targ; |
+ int32_t *offs; |
+ int i; |
+ int32_t realBufferSize; |
+ char *realBufferEnd; |
+ const UChar *realSourceEnd; |
+ const UChar *sourceLimit; |
+ UBool checkOffsets = TRUE; |
+ UBool doFlush; |
+ UBool action=FALSE; |
+ char *p; |
+ |
+ |
+ for(i=0;i<NEW_MAX_BUFFER;i++) |
+ junkout[i] = (char)0xF0; |
+ for(i=0;i<NEW_MAX_BUFFER;i++) |
+ junokout[i] = 0xFF; |
+ setNuConvTestName(codepage, "FROM"); |
+ |
+ log_verbose("\nTesting========= %s FROM \n inputbuffer= %d outputbuffer= %d\n", codepage, gInBufferSize, |
+ gOutBufferSize); |
+ |
+ conv = my_ucnv_open(codepage, &status); |
+ if(U_FAILURE(status)) |
+ { |
+ log_data_err("Couldn't open converter %s\n",codepage); |
+ return TRUE; |
+ } |
+ |
+ log_verbose("Converter opened..\n"); |
+ /*----setting the callback routine----*/ |
+ ucnv_setFallback (conv, fallback); |
+ action = ucnv_usesFallback(conv); |
+ if(action != fallback){ |
+ log_err("FAIL: Error is setting fallback. Errocode=%s\n", myErrorName(status)); |
+ } |
+ /*------------------------*/ |
+ src = source; |
+ targ = junkout; |
+ offs = junokout; |
+ |
+ realBufferSize = (sizeof(junkout)/sizeof(junkout[0])); |
+ realBufferEnd = junkout + realBufferSize; |
+ realSourceEnd = source + sourceLen; |
+ |
+ if ( gOutBufferSize != realBufferSize ) |
+ checkOffsets = FALSE; |
+ |
+ if( gInBufferSize != NEW_MAX_BUFFER ) |
+ checkOffsets = FALSE; |
+ |
+ do |
+ { |
+ end = nct_min(targ + gOutBufferSize, realBufferEnd); |
+ sourceLimit = nct_min(src + gInBufferSize, realSourceEnd); |
+ |
+ doFlush = (UBool)(sourceLimit == realSourceEnd); |
+ |
+ if(targ == realBufferEnd) |
+ { |
+ log_err("Error, overflowed the real buffer while about to call fromUnicode! targ=%08lx %s", targ, gNuConvTestName); |
+ return FALSE; |
+ } |
+ log_verbose("calling fromUnicode @ SOURCE:%08lx to %08lx TARGET: %08lx to %08lx, flush=%s\n", src,sourceLimit, targ,end, doFlush?"TRUE":"FALSE"); |
+ |
+ |
+ status = U_ZERO_ERROR; |
+ |
+ ucnv_fromUnicode (conv, |
+ (char **)&targ, |
+ (const char *)end, |
+ &src, |
+ sourceLimit, |
+ checkOffsets ? offs : NULL, |
+ doFlush, /* flush if we're at the end of the input data */ |
+ &status); |
+ |
+ } while ( (status == U_BUFFER_OVERFLOW_ERROR) || (sourceLimit < realSourceEnd) ); |
+ |
+ if(U_FAILURE(status)) |
+ { |
+ log_err("Problem doing toUnicode, errcode %d %s\n", myErrorName(status), gNuConvTestName); |
+ return FALSE; |
+ } |
+ |
+ log_verbose("\nConversion done [%d uchars in -> %d chars out]. \nResult :", |
+ sourceLen, targ-junkout); |
+ if(getTestOption(VERBOSITY_OPTION)) |
+ { |
+ char junk[9999]; |
+ char offset_str[9999]; |
+ |
+ junk[0] = 0; |
+ offset_str[0] = 0; |
+ for(p = junkout;p<targ;p++) |
+ { |
+ sprintf(junk + uprv_strlen(junk), "0x%02x, ", (0xFF) & (unsigned int)*p); |
+ sprintf(offset_str + strlen(offset_str), "0x%02x, ", (0xFF) & (unsigned int)junokout[p-junkout]); |
+ } |
+ |
+ log_verbose(junk); |
+ printSeq((const unsigned char*)expect, expectLen); |
+ if ( checkOffsets ) |
+ { |
+ log_verbose("\nOffsets:"); |
+ log_verbose(offset_str); |
+ } |
+ log_verbose("\n"); |
+ } |
+ ucnv_close(conv); |
+ |
+ |
+ if(expectLen != targ-junkout) |
+ { |
+ log_err("Expected %d chars out, got %d %s\n", expectLen, targ-junkout, gNuConvTestName); |
+ log_verbose("Expected %d chars out, got %d %s\n", expectLen, targ-junkout, gNuConvTestName); |
+ printSeqErr((const unsigned char*)junkout, (int32_t)(targ-junkout)); |
+ printSeqErr((const unsigned char*)expect, expectLen); |
+ return FALSE; |
+ } |
+ |
+ if (checkOffsets && (expectOffsets != 0) ) |
+ { |
+ log_verbose("\ncomparing %d offsets..\n", targ-junkout); |
+ if(uprv_memcmp(junokout,expectOffsets,(targ-junkout) * sizeof(int32_t) )){ |
+ log_err("\ndid not get the expected offsets while %s \n", gNuConvTestName); |
+ log_err("Got : "); |
+ printSeqErr((const unsigned char*)junkout, (int32_t)(targ-junkout)); |
+ for(p=junkout;p<targ;p++) |
+ log_err("%d, ", junokout[p-junkout]); |
+ log_err("\nExpected: "); |
+ for(i=0; i<(targ-junkout); i++) |
+ log_err("%d,", expectOffsets[i]); |
+ } |
+ } |
+ |
+ log_verbose("\n\ncomparing..\n"); |
+ if(!memcmp(junkout, expect, expectLen)) |
+ { |
+ log_verbose("Matches!\n"); |
+ return TRUE; |
+ } |
+ else |
+ { |
+ log_err("String does not match. %s\n", gNuConvTestName); |
+ log_verbose("String does not match. %s\n", gNuConvTestName); |
+ printSeqErr((const unsigned char*)junkout, expectLen); |
+ printSeqErr((const unsigned char*)expect, expectLen); |
+ return FALSE; |
+ } |
+} |
+ |
+static UBool testConvertToUnicode( const uint8_t *source, int sourcelen, const UChar *expect, int expectlen, |
+ const char *codepage, UBool fallback, const int32_t *expectOffsets) |
+{ |
+ UErrorCode status = U_ZERO_ERROR; |
+ UConverter *conv = 0; |
+ UChar junkout[NEW_MAX_BUFFER]; /* FIX */ |
+ int32_t junokout[NEW_MAX_BUFFER]; /* FIX */ |
+ const char *src; |
+ const char *realSourceEnd; |
+ const char *srcLimit; |
+ UChar *targ; |
+ UChar *end; |
+ int32_t *offs; |
+ int i; |
+ UBool checkOffsets = TRUE; |
+ char junk[9999]; |
+ char offset_str[9999]; |
+ UChar *p; |
+ UBool action; |
+ |
+ int32_t realBufferSize; |
+ UChar *realBufferEnd; |
+ |
+ |
+ for(i=0;i<NEW_MAX_BUFFER;i++) |
+ junkout[i] = 0xFFFE; |
+ |
+ for(i=0;i<NEW_MAX_BUFFER;i++) |
+ junokout[i] = -1; |
+ |
+ setNuConvTestName(codepage, "TO"); |
+ |
+ log_verbose("\n========= %s\n", gNuConvTestName); |
+ |
+ conv = my_ucnv_open(codepage, &status); |
+ if(U_FAILURE(status)) |
+ { |
+ log_data_err("Couldn't open converter %s\n",gNuConvTestName); |
+ return TRUE; /* because it has been logged */ |
+ } |
+ |
+ log_verbose("Converter opened..\n"); |
+ |
+ src = (const char *)source; |
+ targ = junkout; |
+ offs = junokout; |
+ |
+ realBufferSize = (sizeof(junkout)/sizeof(junkout[0])); |
+ realBufferEnd = junkout + realBufferSize; |
+ realSourceEnd = src + sourcelen; |
+ /*----setting the fallback routine----*/ |
+ ucnv_setFallback (conv, fallback); |
+ action = ucnv_usesFallback(conv); |
+ if(action != fallback){ |
+ log_err("FAIL: Error is setting fallback. Errocode=%s\n", myErrorName(status)); |
+ } |
+ /*-------------------------------------*/ |
+ if ( gOutBufferSize != realBufferSize ) |
+ checkOffsets = FALSE; |
+ |
+ if( gInBufferSize != NEW_MAX_BUFFER ) |
+ checkOffsets = FALSE; |
+ |
+ do |
+ { |
+ end = nct_min( targ + gOutBufferSize, realBufferEnd); |
+ srcLimit = nct_min(realSourceEnd, src + gInBufferSize); |
+ |
+ if(targ == realBufferEnd) |
+ { |
+ log_err("Error, the end would overflow the real output buffer while about to call toUnicode! tarjey=%08lx %s",targ,gNuConvTestName); |
+ return FALSE; |
+ } |
+ log_verbose("calling toUnicode @ %08lx to %08lx\n", targ,end); |
+ |
+ |
+ |
+ status = U_ZERO_ERROR; |
+ |
+ ucnv_toUnicode (conv, |
+ &targ, |
+ end, |
+ (const char **)&src, |
+ (const char *)srcLimit, |
+ checkOffsets ? offs : NULL, |
+ (UBool)(srcLimit == realSourceEnd), /* flush if we're at the end of hte source data */ |
+ &status); |
+ } while ( (status == U_BUFFER_OVERFLOW_ERROR) || (srcLimit < realSourceEnd) ); /* while we just need another buffer */ |
+ |
+ |
+ if(U_FAILURE(status)) |
+ { |
+ log_err("Problem doing toUnicode, errcode %s %s\n", myErrorName(status), gNuConvTestName); |
+ return FALSE; |
+ } |
+ |
+ log_verbose("\nConversion done. %d bytes -> %d chars.\nResult :", |
+ sourcelen, targ-junkout); |
+ if(getTestOption(VERBOSITY_OPTION)) |
+ { |
+ |
+ junk[0] = 0; |
+ offset_str[0] = 0; |
+ |
+ for(p = junkout;p<targ;p++) |
+ { |
+ sprintf(junk + strlen(junk), "0x%04x, ", (0xFFFF) & (unsigned int)*p); |
+ sprintf(offset_str + strlen(offset_str), "0x%04x, ", (0xFFFF) & (unsigned int)junokout[p-junkout]); |
+ } |
+ |
+ log_verbose(junk); |
+ printUSeq(expect, expectlen); |
+ if ( checkOffsets ) |
+ { |
+ log_verbose("\nOffsets:"); |
+ log_verbose(offset_str); |
+ } |
+ log_verbose("\n"); |
+ } |
+ ucnv_close(conv); |
+ |
+ log_verbose("comparing %d uchars (%d bytes)..\n",expectlen,expectlen*2); |
+ |
+ if (checkOffsets && (expectOffsets != 0)) |
+ { |
+ if(memcmp(junokout,expectOffsets,(targ-junkout) * sizeof(int32_t))) |
+ { |
+ log_err("\n\ndid not get the expected offsets while %s \n", gNuConvTestName); |
+ log_err("\nGot : "); |
+ for(p=junkout;p<targ;p++) |
+ log_err("%d, ", junokout[p-junkout]); |
+ log_err("\nExpected: "); |
+ for(i=0; i<(targ-junkout); i++) |
+ log_err("%d,", expectOffsets[i]); |
+ log_err(""); |
+ for(i=0; i<(targ-junkout); i++) |
+ log_err("0x%04X,", junkout[i]); |
+ log_err(""); |
+ for(i=0; i<(src-(const char *)source); i++) |
+ log_err("0x%04X,", (unsigned char)source[i]); |
+ } |
+ } |
+ |
+ if(!memcmp(junkout, expect, expectlen*2)) |
+ { |
+ log_verbose("Matches!\n"); |
+ return TRUE; |
+ } |
+ else |
+ { |
+ log_err("String does not match. %s\n", gNuConvTestName); |
+ log_verbose("String does not match. %s\n", gNuConvTestName); |
+ printUSeqErr(junkout, expectlen); |
+ printf("\n"); |
+ printUSeqErr(expect, expectlen); |
+ return FALSE; |
+ } |
+} |
+ |
+ |
+ |
+static void TestConvertFallBackWithBufferSizes(int32_t outsize, int32_t insize ) |
+{ |
+ |
+ static const UChar SBCSText[] = |
+ { 0x0021, 0xFF01, 0x0022, 0xFF02, 0x0023, 0xFF03, 0x003A, 0xFF1A, 0x003B, 0xFF1B, 0x003C, 0xFF1C }; |
+ /* 21, ?, 22, ?, 23, ?, 3a, ?, 3b, ?, 3c, ? SBCS*/ |
+ static const uint8_t expectedNative[] = |
+ { 0x21, 0x21, 0x22, 0x22, 0x23, 0x23, 0x3a, 0x3a, 0x3b, 0x3b, 0x3c, 0x3c}; |
+ static const UChar retrievedSBCSText[]= |
+ { 0x0021, 0x0021, 0x0022, 0x0022, 0x0023, 0x0023, 0x003A, 0x003A, 0x003B, 0x003B, 0x003C, 0x003C }; |
+ static const int32_t toNativeOffs [] = |
+ { 0x00, 0x01, 0x02, 0x03, 0x04, 0x05, 0x06, 0x07, 0x08, 0x09, 0x0a, 0x0b}; |
+ static const int32_t fromNativeoffs [] = |
+ { 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11}; |
+ |
+ |
+ /* 1363 isn't DBCS, but it has the DBCS section */ |
+ static const UChar DBCSText[] = |
+ { 0x00a1, 0x00ad, 0x2010, 0x00b7, 0x30fb}; |
+ static const uint8_t expectedIBM1363_DBCS[] = |
+ { 0xa2, 0xae, 0xa1 ,0xa9, 0xa1, 0xa9,0xa1 ,0xa4, 0xa1, 0xa4}; |
+ static const UChar retrievedDBCSText[]= |
+ { 0x00a1, 0x2010, 0x2010, 0x30fb, 0x30fb }; |
+ static const int32_t toIBM1363Offs_DBCS[] = |
+ { 0x00, 0x00, 0x01,0x01, 0x02, 0x02, 0x03, 0x03, 0x04, 0x04}; |
+ static const int32_t fromIBM1363offs_DBCS[] = |
+ { 0, 2, 4, 6, 8}; |
+ |
+ |
+ static const UChar MBCSText[] = |
+ { 0x0001, 0x263a, 0x2013, 0x2014, 0x263b, 0x0002}; |
+ static const uint8_t expectedIBM950[] = |
+ { 0x01, 0x01, 0xa1, 0x56, 0xa1, 0x56, 0x02, 0x02}; |
+ static const UChar retrievedMBCSText[]= |
+ { 0x0001, 0x0001, 0x2014, 0x2014, 0x0002, 0x0002}; |
+ static const int32_t toIBM950Offs [] = |
+ { 0x00, 0x01, 0x02, 0x02, 0x03, 0x03, 0x04, 0x05}; |
+ static const int32_t fromIBM950offs [] = |
+ { 0, 1, 2, 4, 6, 7}; |
+ |
+ static const UChar MBCSText1363[] = |
+ { 0x0005, |
+ 0xffe8, |
+ 0x0007, |
+ 0x2022, |
+ 0x005c, |
+ 0x00b7, |
+ 0x3016, |
+ 0x30fb, |
+ 0x9a36}; |
+ static const uint8_t expectedIBM1363[] = |
+ { 0x05, |
+ 0x05, |
+ 0x07, |
+ 0x07, |
+ 0x7f, |
+ 0xa1, 0xa4, |
+ 0xa1, 0xe0, |
+ 0xa1, 0xa4, |
+ 0xf5, 0xe2}; |
+ static const UChar retrievedMBCSText1363[]= |
+ { 0x0005, 0x0005, 0x0007, 0x0007, 0x001a, 0x30fb, 0x25a1, 0x30fb, 0x9a36}; |
+ static const int32_t toIBM1363Offs [] = |
+ { 0x00, 0x01, 0x02, 0x03, 0x04, 0x05, 0x05, 0x06, 0x06, 0x07, 0x07, 0x08, 0x08}; |
+ static const int32_t fromIBM1363offs [] = |
+ { 0, 1, 2, 3, 4, 5, 7, 9, 11}; |
+ |
+ |
+ |
+ static const char* nativeCodePage[]={ |
+ /*NLCS Mapping*/ |
+ "ibm-437", |
+ "ibm-850", |
+ "ibm-878", |
+ "ibm-923", |
+ "ibm-1051", |
+ "ibm-1089", |
+ "ibm-1250", |
+ "ibm-1251", |
+ "ibm-1253", |
+ "ibm-1254", |
+ "ibm-1255", |
+ "ibm-1256", |
+ "ibm-1257", |
+ "ibm-1258", |
+ "ibm-1276" |
+ }; |
+ |
+ int32_t i=0; |
+ gInBufferSize = insize; |
+ gOutBufferSize = outsize; |
+ |
+ for(i=0; i<sizeof(nativeCodePage)/sizeof(nativeCodePage[0]); i++){ |
+ log_verbose("Testing %s\n", nativeCodePage[i]); |
+ if(!testConvertFromUnicode(SBCSText, sizeof(SBCSText)/sizeof(SBCSText[0]), |
+ expectedNative, sizeof(expectedNative), nativeCodePage[i], TRUE, toNativeOffs )) |
+ log_err("u-> %s(SBCS) with FallBack did not match.\n", nativeCodePage[i]); |
+ |
+ if(!testConvertToUnicode(expectedNative, sizeof(expectedNative), |
+ retrievedSBCSText, sizeof(retrievedSBCSText)/sizeof(retrievedSBCSText[0]), nativeCodePage[i], TRUE, fromNativeoffs )) |
+ log_err("%s->u(SBCS) with Fallback did not match.\n", nativeCodePage[i]); |
+ } |
+ |
+ /*DBCS*/ |
+ if(!testConvertFromUnicode(DBCSText, sizeof(DBCSText)/sizeof(DBCSText[0]), |
+ expectedIBM1363_DBCS, sizeof(expectedIBM1363_DBCS), "ibm-1363", TRUE, toIBM1363Offs_DBCS )) |
+ log_err("u-> ibm-1363(DBCS portion) with FallBack did not match.\n"); |
+ |
+ if(!testConvertToUnicode(expectedIBM1363_DBCS, sizeof(expectedIBM1363_DBCS), |
+ retrievedDBCSText, sizeof(retrievedDBCSText)/sizeof(retrievedDBCSText[0]),"ibm-1363", TRUE, fromIBM1363offs_DBCS )) |
+ log_err("ibm-1363->u(DBCS portion) with Fallback did not match.\n"); |
+ |
+ |
+ /*MBCS*/ |
+ if(!testConvertFromUnicode(MBCSText, sizeof(MBCSText)/sizeof(MBCSText[0]), |
+ expectedIBM950, sizeof(expectedIBM950), "ibm-950", TRUE, toIBM950Offs )) |
+ log_err("u-> ibm-950(MBCS) with FallBack did not match.\n"); |
+ |
+ if(!testConvertToUnicode(expectedIBM950, sizeof(expectedIBM950), |
+ retrievedMBCSText, sizeof(retrievedMBCSText)/sizeof(retrievedMBCSText[0]),"ibm-950", TRUE, fromIBM950offs )) |
+ log_err("ibm-950->u(MBCS) with Fallback did not match.\n"); |
+ |
+ /*commented untill data table is available*/ |
+ log_verbose("toUnicode fallback with fallback data for MBCS\n"); |
+ { |
+ const uint8_t IBM950input[] = { |
+ 0xf4, 0x87, 0xa4, 0x4a, 0xf4, 0x88, 0xa4, 0x4b, |
+ 0xf9, 0x92, 0xdc, 0xb0, }; |
+ UChar expectedUnicodeText[]= { 0x5165, 0x5165, 0x516b, 0x516b, 0x9ef9, 0x9ef9}; |
+ int32_t fromIBM950inputOffs [] = { 0, 2, 4, 6, 8, 10}; |
+ /* for testing reverse fallback behavior */ |
+ UChar expectedFallbackFalse[]= { 0x5165, 0x5165, 0x516b, 0x516b, 0x9ef9, 0x9ef9}; |
+ |
+ if(!testConvertToUnicode(IBM950input, sizeof(IBM950input), |
+ expectedUnicodeText, sizeof(expectedUnicodeText)/sizeof(expectedUnicodeText[0]),"ibm-950", TRUE, fromIBM950inputOffs )) |
+ log_err("ibm-950->u(MBCS) with Fallback did not match.\n"); |
+ if(!testConvertToUnicode(IBM950input, sizeof(IBM950input), |
+ expectedFallbackFalse, sizeof(expectedFallbackFalse)/sizeof(expectedFallbackFalse[0]),"ibm-950", FALSE, fromIBM950inputOffs )) |
+ log_err("ibm-950->u(MBCS) with Fallback did not match.\n"); |
+ |
+ } |
+ log_verbose("toUnicode fallback with fallback data for euc-tw\n"); |
+ { |
+ const uint8_t euc_tw_input[] = { |
+ 0xA7, 0xCC, 0x8E, 0xA2, 0xA1, 0xAB, |
+ 0xA8, 0xC7, 0xC8, 0xDE, |
+ 0xA8, 0xCD, 0x8E, 0xA2, 0xA2, 0xEA,}; |
+ UChar expectedUnicodeText[]= { 0x5C6E, 0x5C6E, 0x81FC, 0x81FC, 0x8278, 0x8278}; |
+ int32_t from_euc_tw_offs [] = { 0, 2, 6, 8, 10, 12}; |
+ /* for testing reverse fallback behavior */ |
+ UChar expectedFallbackFalse[]= { 0x5C6E, 0x5C6E, 0x81FC, 0x81FC, 0x8278, 0x8278}; |
+ |
+ if(!testConvertToUnicode(euc_tw_input, sizeof(euc_tw_input), |
+ expectedUnicodeText, sizeof(expectedUnicodeText)/sizeof(expectedUnicodeText[0]),"euc-tw", TRUE, from_euc_tw_offs )) |
+ log_err("from euc-tw->u with Fallback did not match.\n"); |
+ |
+ if(!testConvertToUnicode(euc_tw_input, sizeof(euc_tw_input), |
+ expectedFallbackFalse, sizeof(expectedFallbackFalse)/sizeof(expectedFallbackFalse[0]),"euc-tw", FALSE, from_euc_tw_offs )) |
+ log_err("from euc-tw->u with Fallback false did not match.\n"); |
+ |
+ |
+ } |
+ log_verbose("fromUnicode to euc-tw with fallback data euc-tw\n"); |
+ { |
+ UChar inputText[]= { 0x0001, 0x008e, 0x203e, 0x2223, 0xff5c, 0x5296, |
+ 0x5C6E, 0x5C6E, 0x81FC, 0x81FC, 0x8278, 0x8278, 0xEDEC}; |
+ const uint8_t expected_euc_tw[] = { |
+ 0x01, 0x1a, 0xa2, 0xa3, |
+ 0xa2, 0xde, 0xa2, 0xde, |
+ 0x8e, 0xa2, 0xe5, 0xb9, |
+ 0x8e, 0xa2, 0xa1, 0xab, 0x8e, 0xa2, 0xa1, 0xab, |
+ 0xc8, 0xde, 0xc8, 0xde, |
+ 0x8e, 0xa2, 0xa2, 0xea, 0x8e, 0xa2, 0xa2, 0xea, |
+ 0x8e, 0xac, 0xc6, 0xf7}; |
+ int32_t to_euc_tw_offs [] = { 0, 1, 2, 2, 3, 3, 4, 4, 5, 5, 5, 5, 6, 6, |
+ 6, 6, 7, 7, 7, 7, 8, 8, 9, 9, 10, 10, 10, 10, 11, 11, 11, 11, 12, 12, 12, 12}; |
+ |
+ if(!testConvertFromUnicode(inputText, sizeof(inputText)/sizeof(inputText[0]), |
+ expected_euc_tw, sizeof(expected_euc_tw), "euc-tw", TRUE, to_euc_tw_offs )) |
+ log_err("u-> euc-tw with FallBack did not match.\n"); |
+ |
+ } |
+ |
+ /*MBCS 1363*/ |
+ if(!testConvertFromUnicode(MBCSText1363, sizeof(MBCSText1363)/sizeof(MBCSText1363[0]), |
+ expectedIBM1363, sizeof(expectedIBM1363), "ibm-1363", TRUE, toIBM1363Offs )) |
+ log_err("u-> ibm-1363(MBCS) with FallBack did not match.\n"); |
+ |
+ if(!testConvertToUnicode(expectedIBM1363, sizeof(expectedIBM1363), |
+ retrievedMBCSText1363, sizeof(retrievedMBCSText1363)/sizeof(retrievedMBCSText1363[0]),"ibm-1363", TRUE, fromIBM1363offs )) |
+ log_err("ibm-1363->u(MBCS) with Fallback did not match.\n"); |
+ |
+ |
+ /*some more test to increase the code coverage in MBCS. Create an test converter from test1.ucm |
+ which is test file for MBCS conversion with single-byte codepage data.*/ |
+ { |
+ |
+ /* MBCS with single byte codepage data test1.ucm*/ |
+ const UChar unicodeInput[] = { 0x20ac, 0x0005, 0x0006, 0xdbc4, 0xde34, 0xdbba, 0xdfcd, 0x0003}; |
+ const uint8_t expectedtest1[] = { 0x00, 0x05, 0xff, 0x07, 0x08, 0xff,}; |
+ int32_t totest1Offs[] = { 0, 1, 2, 3, 5, 7}; |
+ |
+ const uint8_t test1input[] = { 0x00, 0x05, 0x06, 0x07, 0x08, 0x09}; |
+ const UChar expectedUnicode[] = { 0x20ac, 0x0005, 0x0006, 0xdbc4, 0xde34, 0xfffd, 0xfffd, 0xfffe}; |
+ int32_t fromtest1Offs[] = { 0, 1, 2, 3, 3, 4,5}; |
+ |
+ /*from Unicode*/ |
+ if(!testConvertFromUnicode(unicodeInput, sizeof(unicodeInput)/sizeof(unicodeInput[0]), |
+ expectedtest1, sizeof(expectedtest1), "@test1", TRUE, totest1Offs )) |
+ log_err("u-> test1(MBCS conversion with single-byte) did not match.\n"); |
+ |
+ /*to Unicode*/ |
+ if(!testConvertToUnicode(test1input, sizeof(test1input), |
+ expectedUnicode, sizeof(expectedUnicode)/sizeof(expectedUnicode[0]), "@test1", TRUE, fromtest1Offs )) |
+ log_err("test1(MBCS conversion with single-byte) -> u did not match.\n"); |
+ |
+ } |
+ |
+ /*some more test to increase the code coverage in MBCS. Create an test converter from test3.ucm |
+ which is test file for MBCS conversion with three-byte codepage data.*/ |
+ { |
+ |
+ /* MBCS with three byte codepage data test3.ucm*/ |
+ const UChar unicodeInput[] = { 0x20ac, 0x0005, 0x0006, 0xdbc4, 0xde34, 0xdbba, 0xdfcd, 0x000b, 0xd84d, 0xdc56, 0x000e, 0x0003, }; |
+ const uint8_t expectedtest3[] = { 0x00, 0x05, 0xff, 0x07, 0xff, 0x01, 0x02, 0x0b, 0x01, 0x02, 0x0a, 0xff, 0xff,}; |
+ int32_t totest3Offs[] = { 0, 1, 2, 3, 5, 7, 7, 7, 8, 8, 8, 10, 11}; |
+ |
+ const uint8_t test3input[] = { 0x00, 0x05, 0x06, 0x01, 0x02, 0x0b, 0x07, 0x01, 0x02, 0x0a, |
+ 0x01, 0x02, 0x0e, 0x01, 0x02, 0x0d, 0x03, 0x01, 0x02, 0x0f,}; |
+ const UChar expectedUnicode[] = { 0x20ac, 0x0005, 0x0006, 0x000b, 0xdbc4, 0xde34, 0xd84d, 0xdc56, |
+ 0x000e, 0xd891, 0xdd67, 0xfffd, 0xfffd }; |
+ int32_t fromtest3Offs[] = { 0, 1, 2, 3, 6, 6, 7, 7, 10, 13, 13, 16, 17}; |
+ |
+ /*from Unicode*/ |
+ if(!testConvertFromUnicode(unicodeInput, sizeof(unicodeInput)/sizeof(unicodeInput[0]), |
+ expectedtest3, sizeof(expectedtest3), "@test3", TRUE, totest3Offs )) |
+ log_err("u-> test3(MBCS conversion with three-byte) did not match.\n"); |
+ |
+ /*to Unicode*/ |
+ if(!testConvertToUnicode(test3input, sizeof(test3input), |
+ expectedUnicode, sizeof(expectedUnicode)/sizeof(expectedUnicode[0]), "@test3", TRUE, fromtest3Offs )) |
+ log_err("test3(MBCS conversion with three-byte) -> u did not match.\n"); |
+ |
+ } |
+ |
+ /*some more test to increase the code coverage in MBCS. Create an test converter from test4.ucm |
+ which is test file for MBCS conversion with four-byte codepage data.*/ |
+ { |
+ |
+ /* MBCS with three byte codepage data test4.ucm*/ |
+ const UChar unicodeInput[] = |
+ { 0x20ac, 0x0005, 0x0006, 0x000b, 0xdbc4, 0xde34, 0xdbba, 0xdfcd, |
+ 0xd84d, 0xdc56, 0x000e, 0xd891, 0xdd67, 0x000f}; |
+ const uint8_t expectedtest4[] = |
+ { 0x00, 0x05, 0xff, 0x01, 0x02, 0x03, 0x0b, 0x07, 0xff, |
+ 0x01, 0x02, 0x03, 0x0a, 0xff, 0xff, 0xff}; |
+ int32_t totest4Offs[] = |
+ { 0, 1, 2, 3, 3, 3, 3, 4, 6, 8, 8, 8, 8, 10, 11, 13}; |
+ |
+ const uint8_t test4input[] = |
+ { 0x00, 0x05, 0x06, 0x01, 0x02, 0x03, 0x0b, 0x07, 0x08, |
+ 0x01, 0x02, 0x03, 0x0a, 0x01, 0x02, 0x03, 0x0e, 0x01, 0x02, 0x03, 0x0d, 0x03, 0x01, 0x02, 0x03, 0x0c,}; |
+ const UChar expectedUnicode[] = |
+ { 0x20ac, 0x0005, 0x0006, 0x000b, 0xdbc4, 0xde34, 0xdbba, 0xdfcd, |
+ 0xd84d, 0xdc56, 0x000e, 0xd891, 0xdd67, 0x1a, 0xfffd}; |
+ int32_t fromtest4Offs[] = |
+ { 0, 1, 2, 3, 7, 7, 8, 8, 9, 9, 13, 17, 17, 21, 22,}; |
+ |
+ /*from Unicode*/ |
+ if(!testConvertFromUnicode(unicodeInput, sizeof(unicodeInput)/sizeof(unicodeInput[0]), |
+ expectedtest4, sizeof(expectedtest4), "@test4", TRUE, totest4Offs )) |
+ log_err("u-> test4(MBCS conversion with four-byte) did not match.\n"); |
+ |
+ /*to Unicode*/ |
+ if(!testConvertToUnicode(test4input, sizeof(test4input), |
+ expectedUnicode, sizeof(expectedUnicode)/sizeof(expectedUnicode[0]), "@test4", TRUE, fromtest4Offs )) |
+ log_err("test4(MBCS conversion with four-byte) -> u did not match.\n"); |
+ |
+ } |
+ /* Test for jitterbug 509 EBCDIC_STATEFUL Converters*/ |
+ { |
+ const UChar unicodeInput[] = {0x00AF, 0x2013, 0x2223, 0x004C, 0x5F5D, 0xFF5E }; |
+ const uint8_t expectedtest1[] = {0x0E,0x42,0xA1, 0x44,0x4A, 0x42,0x4F, 0x0F,0xD3, 0x0E,0x65,0x60, 0x43,0xA1,0x0f }; |
+ int32_t totest1Offs[] = {0, 0, 0, 1, 1, 2, 2, 3, 3, 4, 4, 4, 5, 5, 5 }; |
+ const uint8_t test1input[] = {0x0E,0x42,0xA1, 0x44,0x4A, 0x42,0x4F, 0x0F,0xD3, 0x0E,0x65,0x60, 0x43,0xA1 }; |
+ const UChar expectedUnicode[] = {0x203e, 0x2014, 0xff5c, 0x004c, 0x5f5e, 0x223c }; |
+ int32_t fromtest1Offs[] = {1, 3, 5, 8, 10, 12 }; |
+ /*from Unicode*/ |
+ if(!testConvertFromUnicode(unicodeInput, sizeof(unicodeInput)/sizeof(unicodeInput[0]), |
+ expectedtest1, sizeof(expectedtest1), "ibm-1371", TRUE, totest1Offs )) |
+ log_err("u-> ibm-1371(MBCS conversion with single-byte) did not match.,\n"); |
+ /*to Unicode*/ |
+ if(!testConvertToUnicode(test1input, sizeof(test1input), |
+ expectedUnicode, sizeof(expectedUnicode)/sizeof(expectedUnicode[0]), "ibm-1371", TRUE, fromtest1Offs )) |
+ log_err("ibm-1371(MBCS conversion with single-byte) -> u did not match.,\n"); |
+ } |
+ |
+} |
+#else |
+void addTestConverterFallBack(TestNode** root) |
+{ |
+ /* test nothing... */ |
+ |
+} |
+#endif |
Property changes on: icu46/source/test/cintltst/ncnvfbts.c |
___________________________________________________________________ |
Added: svn:eol-style |
+ LF |