242e02c388
X-SVN-Rev: 39583
754 lines
28 KiB
C
754 lines
28 KiB
C
// © 2016 and later: Unicode, Inc. and others.
|
|
// License & terms of use: http://www.unicode.org/copyright.html
|
|
/********************************************************************
|
|
* COPYRIGHT:
|
|
* Copyright (c) 1997-2016, International Business Machines Corporation and
|
|
* others. All Rights Reserved.
|
|
***************************************************************************/
|
|
/*****************************************************************************
|
|
*
|
|
* File NCNVFBTS
|
|
*
|
|
* Modification History:
|
|
* Name Date Description
|
|
* Madhu Katragadda 06/23/2000 Tests for Converter FallBack API and Functionality
|
|
******************************************************************************
|
|
*/
|
|
#include <stdio.h>
|
|
#include "unicode/uloc.h"
|
|
#include "unicode/ucnv.h"
|
|
#include "unicode/ucnv_err.h"
|
|
#include "cintltst.h"
|
|
#include "unicode/utypes.h"
|
|
#include "unicode/ustring.h"
|
|
#include "ncnvfbts.h"
|
|
#include "cmemory.h"
|
|
#include "cstring.h"
|
|
|
|
#if !UCONFIG_NO_LEGACY_CONVERSION
|
|
/* Number of elements in the scratch output/offset buffers of the conversion helpers. */
#define NEW_MAX_BUFFER 999

/*
 * Smaller of x and y.
 * Every use of an argument is parenthesized so that operands containing
 * low-precedence operators (e.g. a | b) compare and select correctly.
 * Each argument may still be evaluated twice: do not pass expressions with
 * side effects.
 */
#define nct_min(x,y) (((x)<(y)) ? (x) : (y))

/* Per-call chunk sizes for the current run; assigned in TestConvertFallBackWithBufferSizes(). */
static int32_t gInBufferSize = 0;
static int32_t gOutBufferSize = 0;

/* Label used in diagnostics; filled in by setNuConvTestName(). */
static char gNuConvTestName[1024];
|
|
|
|
/*
 * Opens the converter named by cnv.
 * A name that starts with '@' is opened from the "testdata" package, with the
 * '@' stripped; any other name (including NULL) goes to ucnv_open() unchanged.
 * The outcome is reported through err by whichever open function is called.
 */
static UConverter *my_ucnv_open(const char *cnv, UErrorCode *err)
{
    if (cnv == NULL || cnv[0] != '@') {
        return ucnv_open(cnv, err);
    }
    return ucnv_openPackage("testdata", cnv + 1, err);
}
|
|
|
|
|
|
/* Logs the first len bytes of a at verbose level, as "{0xNN 0xNN ... }". */
static void printSeq(const unsigned char* a, int len)
{
    int idx;

    log_verbose("{");
    for (idx = 0; idx < len; idx++) {
        log_verbose("0x%02x ", a[idx]);
    }
    log_verbose("}\n");
}
|
|
|
|
/* Logs the first len UChars of a at verbose level, as "{U+0xNNNN 0xNNNN ... }". */
static void printUSeq(const UChar* a, int len)
{
    int idx;

    log_verbose("{U+");
    for (idx = 0; idx < len; idx++) {
        log_verbose("0x%04x ", a[idx]);
    }
    log_verbose("}\n");
}
|
|
|
|
/* Writes the first len bytes of a to stderr, as "{0xNN 0xNN ... }". */
static void printSeqErr(const unsigned char* a, int len)
{
    int idx;

    fprintf(stderr, "{");
    for (idx = 0; idx < len; idx++) {
        fprintf(stderr, "0x%02x ", a[idx]);
    }
    fprintf(stderr, "}\n");
}
|
|
|
|
/* Writes the first len UChars of a to stderr, as "{U+0xNNNN 0xNNNN ... }". */
static void printUSeqErr(const UChar* a, int len)
{
    int idx;

    fprintf(stderr, "{U+");
    for (idx = 0; idx < len; idx++) {
        fprintf(stderr, "0x%04x ", a[idx]);
    }
    fprintf(stderr,"}\n");
}
|
|
|
|
static void TestConverterFallBack(void)
|
|
{
|
|
TestConvertFallBackWithBufferSizes(10,10);
|
|
TestConvertFallBackWithBufferSizes(2,3);
|
|
TestConvertFallBackWithBufferSizes(3,2);
|
|
TestConvertFallBackWithBufferSizes(NEW_MAX_BUFFER,1);
|
|
TestConvertFallBackWithBufferSizes(NEW_MAX_BUFFER,2);
|
|
TestConvertFallBackWithBufferSizes(NEW_MAX_BUFFER,3);
|
|
TestConvertFallBackWithBufferSizes(NEW_MAX_BUFFER,4);
|
|
TestConvertFallBackWithBufferSizes(NEW_MAX_BUFFER,5);
|
|
TestConvertFallBackWithBufferSizes(NEW_MAX_BUFFER,6);
|
|
TestConvertFallBackWithBufferSizes(1,NEW_MAX_BUFFER);
|
|
TestConvertFallBackWithBufferSizes(2,NEW_MAX_BUFFER);
|
|
TestConvertFallBackWithBufferSizes(3,NEW_MAX_BUFFER);
|
|
TestConvertFallBackWithBufferSizes(4,NEW_MAX_BUFFER);
|
|
TestConvertFallBackWithBufferSizes(5,NEW_MAX_BUFFER);
|
|
TestConvertFallBackWithBufferSizes(NEW_MAX_BUFFER,NEW_MAX_BUFFER);
|
|
|
|
}
|
|
|
|
|
|
void addTestConverterFallBack(TestNode** root);

/*
 * Registers TestConverterFallBack under "tsconv/ncnvfbts/TestConverterFallBack".
 * Nothing is registered when UCONFIG_NO_FILE_IO is set.
 */
void addTestConverterFallBack(TestNode** root)
{
#if !UCONFIG_NO_FILE_IO
    addTest(root, TestConverterFallBack, "tsconv/ncnvfbts/TestConverterFallBack");
#endif
}
|
|
|
|
|
|
/* Note that this test already makes use of statics, so it's not really
|
|
multithread safe.
|
|
This convenience function lets us make the error messages actually useful.
|
|
*/
|
|
|
|
static void setNuConvTestName(const char *codepage, const char *direction)
|
|
{
|
|
sprintf(gNuConvTestName, "[Testing %s %s Unicode, InputBufSiz=%d, OutputBufSiz=%d]",
|
|
codepage,
|
|
direction,
|
|
(int)gInBufferSize,
|
|
(int)gOutBufferSize);
|
|
}
|
|
|
|
|
|
/*
 * Converts source (sourceLen UChars) to codepage with ucnv_fromUnicode(),
 * feeding at most gInBufferSize UChars and accepting at most gOutBufferSize
 * bytes per call, then compares the produced bytes with expect.
 *
 * source         UTF-16 input
 * sourceLen      number of UChars in source
 * expect         expected output bytes
 * expectLen      number of bytes in expect
 * codepage       converter name; a leading '@' selects the "testdata" package
 * fallback       value passed to ucnv_setFallback()
 * expectOffsets  expected offsets, one per output byte, or NULL to skip
 *
 * Offsets are requested and compared only when the conversion is done in a
 * single pass (gInBufferSize == NEW_MAX_BUFFER and gOutBufferSize equal to
 * the output buffer size). An offset mismatch is logged as an error but does
 * not by itself change the return value.
 *
 * Returns TRUE when the output matches, and also when the converter could not
 * be opened (that case is reported through log_data_err). Returns FALSE on
 * conversion failure, length mismatch or content mismatch.
 */
static UBool testConvertFromUnicode(const UChar *source, int sourceLen, const uint8_t *expect, int expectLen,
                const char *codepage, UBool fallback, const int32_t *expectOffsets)
{
    UErrorCode status = U_ZERO_ERROR;
    UConverter *conv = 0;
    char junkout[NEW_MAX_BUFFER];      /* converted bytes */
    int32_t junokout[NEW_MAX_BUFFER];  /* offsets reported by the converter */
    const UChar *src;
    char *end;
    char *targ;
    int32_t *offs;
    int i;
    int outLen;
    int32_t realBufferSize;
    char *realBufferEnd;
    const UChar *realSourceEnd;
    const UChar *sourceLimit;
    UBool checkOffsets = TRUE;
    UBool doFlush;
    UBool action=FALSE;
    char *p;

    /* Pre-fill both buffers with recognizable values. */
    for(i=0;i<NEW_MAX_BUFFER;i++)
        junkout[i] = (char)0xF0;
    for(i=0;i<NEW_MAX_BUFFER;i++)
        junokout[i] = 0xFF;
    setNuConvTestName(codepage, "FROM");

    log_verbose("\nTesting========= %s FROM \n inputbuffer= %d outputbuffer= %d\n", codepage, gInBufferSize,
            gOutBufferSize);

    conv = my_ucnv_open(codepage, &status);
    if(U_FAILURE(status))
    {
        log_data_err("Couldn't open converter %s\n",codepage);
        return TRUE; /* already reported as a data error */
    }

    log_verbose("Converter opened..\n");
    /*----setting the fallback option----*/
    ucnv_setFallback (conv, fallback);
    action = ucnv_usesFallback(conv);
    if(action != fallback){
        log_err("FAIL: Error is setting fallback. Errocode=%s\n", myErrorName(status));
    }
    /*------------------------*/
    src = source;
    targ = junkout;
    offs = junokout;

    realBufferSize = UPRV_LENGTHOF(junkout);
    realBufferEnd = junkout + realBufferSize;
    realSourceEnd = source + sourceLen;

    /* Offsets are only meaningful when everything is converted in one call. */
    if ( gOutBufferSize != realBufferSize )
        checkOffsets = FALSE;

    if( gInBufferSize != NEW_MAX_BUFFER )
        checkOffsets = FALSE;

    do
    {
        /*
         * Clamp the chunk LENGTHS before adding them to the pointers, so no
         * pointer beyond one-past-the-end of either array is ever formed.
         */
        int32_t outRoom = (int32_t)(realBufferEnd - targ);
        int32_t inLeft = (int32_t)(realSourceEnd - src);

        end = targ + nct_min(gOutBufferSize, outRoom);
        sourceLimit = src + nct_min(gInBufferSize, inLeft);

        doFlush = (UBool)(sourceLimit == realSourceEnd);

        if(targ == realBufferEnd)
        {
            log_err("Error, overflowed the real buffer while about to call fromUnicode! targ=%p %s", (void *)targ, gNuConvTestName);
            ucnv_close(conv);
            return FALSE;
        }
        log_verbose("calling fromUnicode @ SOURCE:%p to %p TARGET: %p to %p, flush=%s\n",
                    (const void *)src, (const void *)sourceLimit, (void *)targ, (void *)end, doFlush?"TRUE":"FALSE");

        status = U_ZERO_ERROR;

        ucnv_fromUnicode (conv,
                  &targ,
                  (const char *)end,
                  &src,
                  sourceLimit,
                  checkOffsets ? offs : NULL,
                  doFlush, /* flush if we're at the end of the input data */
                  &status);

    } while ( (status == U_BUFFER_OVERFLOW_ERROR) || (sourceLimit < realSourceEnd) );

    if(U_FAILURE(status))
    {
        log_err("Problem doing fromUnicode, errcode %s %s\n", myErrorName(status), gNuConvTestName);
        ucnv_close(conv);
        return FALSE;
    }

    outLen = (int)(targ - junkout);

    log_verbose("\nConversion done [%d uchars in -> %d chars out]. \nResult :",
        sourceLen, outLen);
    if(getTestOption(VERBOSITY_OPTION))
    {
        /* Each entry below is exactly 6 characters, so NEW_MAX_BUFFER entries fit. */
        char junk[9999];
        char offset_str[9999];
        int junkLen = 0;
        int offsLen = 0;

        junk[0] = 0;
        offset_str[0] = 0;
        for(p = junkout;p<targ;p++)
        {
            junkLen += sprintf(junk + junkLen, "0x%02x, ", (0xFF) & (unsigned int)*p);
            offsLen += sprintf(offset_str + offsLen, "0x%02x, ", (0xFF) & (unsigned int)junokout[p-junkout]);
        }

        log_verbose("%s", junk);
        printSeq((const unsigned char*)expect, expectLen);
        if ( checkOffsets )
        {
            log_verbose("\nOffsets:");
            log_verbose("%s", offset_str);
        }
        log_verbose("\n");
    }
    ucnv_close(conv);

    if(expectLen != outLen)
    {
        log_err("Expected %d chars out, got %d %s\n", expectLen, outLen, gNuConvTestName);
        log_verbose("Expected %d chars out, got %d %s\n", expectLen, outLen, gNuConvTestName);
        printSeqErr((const unsigned char*)junkout, (int32_t)outLen);
        printSeqErr((const unsigned char*)expect, expectLen);
        return FALSE;
    }

    if (checkOffsets && (expectOffsets != 0) )
    {
        log_verbose("\ncomparing %d offsets..\n", outLen);
        if(uprv_memcmp(junokout,expectOffsets,(targ-junkout) * sizeof(int32_t) )){
            log_err("\ndid not get the expected offsets while %s \n", gNuConvTestName);
            log_err("Got : ");
            printSeqErr((const unsigned char*)junkout, (int32_t)outLen);
            for(p=junkout;p<targ;p++)
                log_err("%d, ", junokout[p-junkout]);
            log_err("\nExpected: ");
            for(i=0; i<outLen; i++)
                log_err("%d,", expectOffsets[i]);
        }
    }

    log_verbose("\n\ncomparing..\n");
    if(!memcmp(junkout, expect, expectLen))
    {
        log_verbose("Matches!\n");
        return TRUE;
    }
    else
    {
        log_err("String does not match. %s\n", gNuConvTestName);
        log_verbose("String does not match. %s\n", gNuConvTestName);
        printSeqErr((const unsigned char*)junkout, expectLen);
        printSeqErr((const unsigned char*)expect, expectLen);
        return FALSE;
    }
}
|
|
|
|
/*
 * Converts source (sourcelen bytes in codepage) to UTF-16 with
 * ucnv_toUnicode(), feeding at most gInBufferSize bytes and accepting at most
 * gOutBufferSize UChars per call, then compares the result with expect.
 *
 * source         input bytes
 * sourcelen      number of bytes in source
 * expect         expected UTF-16 output
 * expectlen      number of UChars of the output buffer compared against expect
 * codepage       converter name; a leading '@' selects the "testdata" package
 * fallback       value passed to ucnv_setFallback()
 * expectOffsets  expected offsets, one per UChar produced, or NULL to skip
 *
 * The output buffer is pre-filled with 0xFFFE and exactly expectlen UChars of
 * it are compared; the number of UChars actually produced is not checked
 * separately. Offsets are requested and compared only for a single-pass
 * conversion (gInBufferSize == NEW_MAX_BUFFER and gOutBufferSize equal to the
 * output buffer size); an offset mismatch is logged as an error but does not
 * by itself change the return value.
 *
 * Returns TRUE when the output matches, and also when the converter could not
 * be opened (that case is reported through log_data_err). Returns FALSE on
 * conversion failure or content mismatch.
 */
static UBool testConvertToUnicode( const uint8_t *source, int sourcelen, const UChar *expect, int expectlen,
               const char *codepage, UBool fallback, const int32_t *expectOffsets)
{
    UErrorCode status = U_ZERO_ERROR;
    UConverter *conv = 0;
    UChar junkout[NEW_MAX_BUFFER];     /* converted UChars */
    int32_t junokout[NEW_MAX_BUFFER];  /* offsets reported by the converter */
    const char *src;
    const char *realSourceEnd;
    const char *srcLimit;
    UChar *targ;
    UChar *end;
    int32_t *offs;
    int i;
    int outLen;
    UBool checkOffsets = TRUE;
    UChar *p;
    UBool action;

    int32_t realBufferSize;
    UChar *realBufferEnd;

    /* Pre-fill both buffers with recognizable values. */
    for(i=0;i<NEW_MAX_BUFFER;i++)
        junkout[i] = 0xFFFE;

    for(i=0;i<NEW_MAX_BUFFER;i++)
        junokout[i] = -1;

    setNuConvTestName(codepage, "TO");

    log_verbose("\n========= %s\n", gNuConvTestName);

    conv = my_ucnv_open(codepage, &status);
    if(U_FAILURE(status))
    {
        log_data_err("Couldn't open converter %s\n",gNuConvTestName);
        return TRUE; /* because it has been logged */
    }

    log_verbose("Converter opened..\n");

    src = (const char *)source;
    targ = junkout;
    offs = junokout;

    realBufferSize = UPRV_LENGTHOF(junkout);
    realBufferEnd = junkout + realBufferSize;
    realSourceEnd = src + sourcelen;
    /*----setting the fallback option----*/
    ucnv_setFallback (conv, fallback);
    action = ucnv_usesFallback(conv);
    if(action != fallback){
        log_err("FAIL: Error is setting fallback. Errocode=%s\n", myErrorName(status));
    }
    /*-------------------------------------*/
    /* Offsets are only meaningful when everything is converted in one call. */
    if ( gOutBufferSize != realBufferSize )
        checkOffsets = FALSE;

    if( gInBufferSize != NEW_MAX_BUFFER )
        checkOffsets = FALSE;

    do
    {
        /*
         * Clamp the chunk LENGTHS before adding them to the pointers, so no
         * pointer beyond one-past-the-end of either array is ever formed.
         */
        int32_t outRoom = (int32_t)(realBufferEnd - targ);
        int32_t inLeft = (int32_t)(realSourceEnd - src);

        end = targ + nct_min(gOutBufferSize, outRoom);
        srcLimit = src + nct_min(gInBufferSize, inLeft);

        if(targ == realBufferEnd)
        {
            log_err("Error, the end would overflow the real output buffer while about to call toUnicode! tarjey=%p %s",(void *)targ,gNuConvTestName);
            ucnv_close(conv);
            return FALSE;
        }
        log_verbose("calling toUnicode @ %p to %p\n", (void *)targ, (void *)end);

        status = U_ZERO_ERROR;

        ucnv_toUnicode (conv,
                &targ,
                end,
                &src,
                srcLimit,
                checkOffsets ? offs : NULL,
                (UBool)(srcLimit == realSourceEnd), /* flush if we're at the end of the source data */
                &status);
    } while ( (status == U_BUFFER_OVERFLOW_ERROR) || (srcLimit < realSourceEnd) ); /* while we just need another buffer */

    if(U_FAILURE(status))
    {
        log_err("Problem doing toUnicode, errcode %s %s\n", myErrorName(status), gNuConvTestName);
        ucnv_close(conv);
        return FALSE;
    }

    outLen = (int)(targ - junkout);

    log_verbose("\nConversion done. %d bytes -> %d chars.\nResult :",
        sourcelen, outLen);
    if(getTestOption(VERBOSITY_OPTION))
    {
        /* Each entry below is exactly 8 characters, so NEW_MAX_BUFFER entries fit. */
        char junk[9999];
        char offset_str[9999];
        int junkLen = 0;
        int offsLen = 0;

        junk[0] = 0;
        offset_str[0] = 0;

        for(p = junkout;p<targ;p++)
        {
            junkLen += sprintf(junk + junkLen, "0x%04x, ", (0xFFFF) & (unsigned int)*p);
            offsLen += sprintf(offset_str + offsLen, "0x%04x, ", (0xFFFF) & (unsigned int)junokout[p-junkout]);
        }

        log_verbose("%s", junk);
        printUSeq(expect, expectlen);
        if ( checkOffsets )
        {
            log_verbose("\nOffsets:");
            log_verbose("%s", offset_str);
        }
        log_verbose("\n");
    }
    ucnv_close(conv);

    log_verbose("comparing %d uchars (%d bytes)..\n",expectlen,expectlen*2);

    if (checkOffsets && (expectOffsets != 0))
    {
        if(memcmp(junokout,expectOffsets,(targ-junkout) * sizeof(int32_t)))
        {
            log_err("\n\ndid not get the expected offsets while %s \n", gNuConvTestName);
            log_err("\nGot : ");
            for(p=junkout;p<targ;p++)
                log_err("%d, ", junokout[p-junkout]);
            log_err("\nExpected: ");
            for(i=0; i<outLen; i++)
                log_err("%d,", expectOffsets[i]);
            log_err("");
            for(i=0; i<outLen; i++)
                log_err("0x%04X,", junkout[i]);
            log_err("");
            for(i=0; i<(src-(const char *)source); i++)
                log_err("0x%04X,", (unsigned char)source[i]);
        }
    }

    if(!memcmp(junkout, expect, expectlen*2))
    {
        log_verbose("Matches!\n");
        return TRUE;
    }
    else
    {
        log_err("String does not match. %s\n", gNuConvTestName);
        log_verbose("String does not match. %s\n", gNuConvTestName);
        printUSeqErr(junkout, expectlen);
        printf("\n");
        printUSeqErr(expect, expectlen);
        return FALSE;
    }
}
|
|
|
|
|
|
|
|
static void TestConvertFallBackWithBufferSizes(int32_t outsize, int32_t insize )
|
|
{
|
|
|
|
static const UChar SBCSText[] =
|
|
{ 0x0021, 0xFF01, 0x0022, 0xFF02, 0x0023, 0xFF03, 0x003A, 0xFF1A, 0x003B, 0xFF1B, 0x003C, 0xFF1C };
|
|
/* 21, ?, 22, ?, 23, ?, 3a, ?, 3b, ?, 3c, ? SBCS*/
|
|
static const uint8_t expectedNative[] =
|
|
{ 0x21, 0x21, 0x22, 0x22, 0x23, 0x23, 0x3a, 0x3a, 0x3b, 0x3b, 0x3c, 0x3c};
|
|
static const UChar retrievedSBCSText[]=
|
|
{ 0x0021, 0x0021, 0x0022, 0x0022, 0x0023, 0x0023, 0x003A, 0x003A, 0x003B, 0x003B, 0x003C, 0x003C };
|
|
static const int32_t toNativeOffs [] =
|
|
{ 0x00, 0x01, 0x02, 0x03, 0x04, 0x05, 0x06, 0x07, 0x08, 0x09, 0x0a, 0x0b};
|
|
static const int32_t fromNativeoffs [] =
|
|
{ 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11};
|
|
|
|
|
|
/* 1363 isn't DBCS, but it has the DBCS section */
|
|
static const UChar DBCSText[] =
|
|
{ 0x00a1, 0x00ad, 0x2010, 0x00b7, 0x30fb};
|
|
static const uint8_t expectedIBM1363_DBCS[] =
|
|
{ 0xa2, 0xae, 0xa1 ,0xa9, 0xa1, 0xa9,0xa1 ,0xa4, 0xa1, 0xa4};
|
|
static const UChar retrievedDBCSText[]=
|
|
{ 0x00a1, 0x2010, 0x2010, 0x30fb, 0x30fb };
|
|
static const int32_t toIBM1363Offs_DBCS[] =
|
|
{ 0x00, 0x00, 0x01,0x01, 0x02, 0x02, 0x03, 0x03, 0x04, 0x04};
|
|
static const int32_t fromIBM1363offs_DBCS[] =
|
|
{ 0, 2, 4, 6, 8};
|
|
|
|
|
|
static const UChar MBCSText[] =
|
|
{ 0x0001, 0x263a, 0x2013, 0x2014, 0x263b, 0x0002};
|
|
static const uint8_t expectedIBM950[] =
|
|
{ 0x01, 0x01, 0xa1, 0x56, 0xa1, 0x56, 0x02, 0x02};
|
|
static const UChar retrievedMBCSText[]=
|
|
{ 0x0001, 0x0001, 0x2014, 0x2014, 0x0002, 0x0002};
|
|
static const int32_t toIBM950Offs [] =
|
|
{ 0x00, 0x01, 0x02, 0x02, 0x03, 0x03, 0x04, 0x05};
|
|
static const int32_t fromIBM950offs [] =
|
|
{ 0, 1, 2, 4, 6, 7};
|
|
|
|
static const UChar MBCSText1363[] =
|
|
{ 0x0005,
|
|
0xffe8,
|
|
0x0007,
|
|
0x2022,
|
|
0x005c,
|
|
0x00b7,
|
|
0x3016,
|
|
0x30fb,
|
|
0x9a36};
|
|
static const uint8_t expectedIBM1363[] =
|
|
{ 0x05,
|
|
0x05,
|
|
0x07,
|
|
0x07,
|
|
0x7f,
|
|
0xa1, 0xa4,
|
|
0xa1, 0xe0,
|
|
0xa1, 0xa4,
|
|
0xf5, 0xe2};
|
|
static const UChar retrievedMBCSText1363[]=
|
|
{ 0x0005, 0x0005, 0x0007, 0x0007, 0x001a, 0x30fb, 0x25a1, 0x30fb, 0x9a36};
|
|
static const int32_t toIBM1363Offs [] =
|
|
{ 0x00, 0x01, 0x02, 0x03, 0x04, 0x05, 0x05, 0x06, 0x06, 0x07, 0x07, 0x08, 0x08};
|
|
static const int32_t fromIBM1363offs [] =
|
|
{ 0, 1, 2, 3, 4, 5, 7, 9, 11};
|
|
|
|
|
|
|
|
static const char* nativeCodePage[]={
|
|
/*NLCS Mapping*/
|
|
"ibm-437",
|
|
"ibm-850",
|
|
"ibm-878",
|
|
"ibm-923",
|
|
"ibm-1051",
|
|
"ibm-1089",
|
|
"ibm-1250",
|
|
"ibm-1251",
|
|
"ibm-1253",
|
|
"ibm-1254",
|
|
"ibm-1255",
|
|
"ibm-1256",
|
|
"ibm-1257",
|
|
"ibm-1258",
|
|
"ibm-1276"
|
|
};
|
|
|
|
int32_t i=0;
|
|
gInBufferSize = insize;
|
|
gOutBufferSize = outsize;
|
|
|
|
for(i=0; i<UPRV_LENGTHOF(nativeCodePage); i++){
|
|
log_verbose("Testing %s\n", nativeCodePage[i]);
|
|
if(!testConvertFromUnicode(SBCSText, UPRV_LENGTHOF(SBCSText),
|
|
expectedNative, sizeof(expectedNative), nativeCodePage[i], TRUE, toNativeOffs ))
|
|
log_err("u-> %s(SBCS) with FallBack did not match.\n", nativeCodePage[i]);
|
|
|
|
if(!testConvertToUnicode(expectedNative, sizeof(expectedNative),
|
|
retrievedSBCSText, UPRV_LENGTHOF(retrievedSBCSText), nativeCodePage[i], TRUE, fromNativeoffs ))
|
|
log_err("%s->u(SBCS) with Fallback did not match.\n", nativeCodePage[i]);
|
|
}
|
|
|
|
/*DBCS*/
|
|
if(!testConvertFromUnicode(DBCSText, UPRV_LENGTHOF(DBCSText),
|
|
expectedIBM1363_DBCS, sizeof(expectedIBM1363_DBCS), "ibm-1363", TRUE, toIBM1363Offs_DBCS ))
|
|
log_err("u-> ibm-1363(DBCS portion) with FallBack did not match.\n");
|
|
|
|
if(!testConvertToUnicode(expectedIBM1363_DBCS, sizeof(expectedIBM1363_DBCS),
|
|
retrievedDBCSText, UPRV_LENGTHOF(retrievedDBCSText),"ibm-1363", TRUE, fromIBM1363offs_DBCS ))
|
|
log_err("ibm-1363->u(DBCS portion) with Fallback did not match.\n");
|
|
|
|
|
|
/*MBCS*/
|
|
if(!testConvertFromUnicode(MBCSText, UPRV_LENGTHOF(MBCSText),
|
|
expectedIBM950, sizeof(expectedIBM950), "ibm-950", TRUE, toIBM950Offs ))
|
|
log_err("u-> ibm-950(MBCS) with FallBack did not match.\n");
|
|
|
|
if(!testConvertToUnicode(expectedIBM950, sizeof(expectedIBM950),
|
|
retrievedMBCSText, UPRV_LENGTHOF(retrievedMBCSText),"ibm-950", TRUE, fromIBM950offs ))
|
|
log_err("ibm-950->u(MBCS) with Fallback did not match.\n");
|
|
|
|
/*commented untill data table is available*/
|
|
log_verbose("toUnicode fallback with fallback data for MBCS\n");
|
|
{
|
|
const uint8_t IBM950input[] = {
|
|
0xf4, 0x87, 0xa4, 0x4a, 0xf4, 0x88, 0xa4, 0x4b,
|
|
0xf9, 0x92, 0xdc, 0xb0, };
|
|
UChar expectedUnicodeText[]= { 0x5165, 0x5165, 0x516b, 0x516b, 0x9ef9, 0x9ef9};
|
|
int32_t fromIBM950inputOffs [] = { 0, 2, 4, 6, 8, 10};
|
|
/* for testing reverse fallback behavior */
|
|
UChar expectedFallbackFalse[]= { 0x5165, 0x5165, 0x516b, 0x516b, 0x9ef9, 0x9ef9};
|
|
|
|
if(!testConvertToUnicode(IBM950input, sizeof(IBM950input),
|
|
expectedUnicodeText, UPRV_LENGTHOF(expectedUnicodeText),"ibm-950", TRUE, fromIBM950inputOffs ))
|
|
log_err("ibm-950->u(MBCS) with Fallback did not match.\n");
|
|
if(!testConvertToUnicode(IBM950input, sizeof(IBM950input),
|
|
expectedFallbackFalse, UPRV_LENGTHOF(expectedFallbackFalse),"ibm-950", FALSE, fromIBM950inputOffs ))
|
|
log_err("ibm-950->u(MBCS) with Fallback did not match.\n");
|
|
|
|
}
|
|
log_verbose("toUnicode fallback with fallback data for euc-tw\n");
|
|
{
|
|
const uint8_t euc_tw_input[] = {
|
|
0xA7, 0xCC, 0x8E, 0xA2, 0xA1, 0xAB,
|
|
0xA8, 0xC7, 0xC8, 0xDE,
|
|
0xA8, 0xCD, 0x8E, 0xA2, 0xA2, 0xEA,};
|
|
UChar expectedUnicodeText[]= { 0x5C6E, 0x5C6E, 0x81FC, 0x81FC, 0x8278, 0x8278};
|
|
int32_t from_euc_tw_offs [] = { 0, 2, 6, 8, 10, 12};
|
|
/* for testing reverse fallback behavior */
|
|
UChar expectedFallbackFalse[]= { 0x5C6E, 0x5C6E, 0x81FC, 0x81FC, 0x8278, 0x8278};
|
|
|
|
if(!testConvertToUnicode(euc_tw_input, sizeof(euc_tw_input),
|
|
expectedUnicodeText, UPRV_LENGTHOF(expectedUnicodeText),"euc-tw", TRUE, from_euc_tw_offs ))
|
|
log_err("from euc-tw->u with Fallback did not match.\n");
|
|
|
|
if(!testConvertToUnicode(euc_tw_input, sizeof(euc_tw_input),
|
|
expectedFallbackFalse, UPRV_LENGTHOF(expectedFallbackFalse),"euc-tw", FALSE, from_euc_tw_offs ))
|
|
log_err("from euc-tw->u with Fallback false did not match.\n");
|
|
|
|
|
|
}
|
|
log_verbose("fromUnicode to euc-tw with fallback data euc-tw\n");
|
|
{
|
|
UChar inputText[]= { 0x0001, 0x008e, 0x203e, 0x2223, 0xff5c, 0x5296,
|
|
0x5C6E, 0x5C6E, 0x81FC, 0x81FC, 0x8278, 0x8278, 0xEDEC};
|
|
const uint8_t expected_euc_tw[] = {
|
|
0x01, 0x1a, 0xa2, 0xa3,
|
|
0xa2, 0xde, 0xa2, 0xde,
|
|
0x8e, 0xa2, 0xe5, 0xb9,
|
|
0x8e, 0xa2, 0xa1, 0xab, 0x8e, 0xa2, 0xa1, 0xab,
|
|
0xc8, 0xde, 0xc8, 0xde,
|
|
0x8e, 0xa2, 0xa2, 0xea, 0x8e, 0xa2, 0xa2, 0xea,
|
|
0x8e, 0xac, 0xc6, 0xf7};
|
|
int32_t to_euc_tw_offs [] = { 0, 1, 2, 2, 3, 3, 4, 4, 5, 5, 5, 5, 6, 6,
|
|
6, 6, 7, 7, 7, 7, 8, 8, 9, 9, 10, 10, 10, 10, 11, 11, 11, 11, 12, 12, 12, 12};
|
|
|
|
if(!testConvertFromUnicode(inputText, UPRV_LENGTHOF(inputText),
|
|
expected_euc_tw, sizeof(expected_euc_tw), "euc-tw", TRUE, to_euc_tw_offs ))
|
|
log_err("u-> euc-tw with FallBack did not match.\n");
|
|
|
|
}
|
|
|
|
/*MBCS 1363*/
|
|
if(!testConvertFromUnicode(MBCSText1363, UPRV_LENGTHOF(MBCSText1363),
|
|
expectedIBM1363, sizeof(expectedIBM1363), "ibm-1363", TRUE, toIBM1363Offs ))
|
|
log_err("u-> ibm-1363(MBCS) with FallBack did not match.\n");
|
|
|
|
if(!testConvertToUnicode(expectedIBM1363, sizeof(expectedIBM1363),
|
|
retrievedMBCSText1363, UPRV_LENGTHOF(retrievedMBCSText1363),"ibm-1363", TRUE, fromIBM1363offs ))
|
|
log_err("ibm-1363->u(MBCS) with Fallback did not match.\n");
|
|
|
|
|
|
/*some more test to increase the code coverage in MBCS. Create an test converter from test1.ucm
|
|
which is test file for MBCS conversion with single-byte codepage data.*/
|
|
{
|
|
|
|
/* MBCS with single byte codepage data test1.ucm*/
|
|
const UChar unicodeInput[] = { 0x20ac, 0x0005, 0x0006, 0xdbc4, 0xde34, 0xdbba, 0xdfcd, 0x0003};
|
|
const uint8_t expectedtest1[] = { 0x00, 0x05, 0xff, 0x07, 0x08, 0xff,};
|
|
int32_t totest1Offs[] = { 0, 1, 2, 3, 5, 7};
|
|
|
|
const uint8_t test1input[] = { 0x00, 0x05, 0x06, 0x07, 0x08, 0x09};
|
|
const UChar expectedUnicode[] = { 0x20ac, 0x0005, 0x0006, 0xdbc4, 0xde34, 0xfffd, 0xfffd, 0xfffe};
|
|
int32_t fromtest1Offs[] = { 0, 1, 2, 3, 3, 4,5};
|
|
|
|
/*from Unicode*/
|
|
if(!testConvertFromUnicode(unicodeInput, UPRV_LENGTHOF(unicodeInput),
|
|
expectedtest1, sizeof(expectedtest1), "@test1", TRUE, totest1Offs ))
|
|
log_err("u-> test1(MBCS conversion with single-byte) did not match.\n");
|
|
|
|
/*to Unicode*/
|
|
if(!testConvertToUnicode(test1input, sizeof(test1input),
|
|
expectedUnicode, UPRV_LENGTHOF(expectedUnicode), "@test1", TRUE, fromtest1Offs ))
|
|
log_err("test1(MBCS conversion with single-byte) -> u did not match.\n");
|
|
|
|
}
|
|
|
|
/*some more test to increase the code coverage in MBCS. Create an test converter from test3.ucm
|
|
which is test file for MBCS conversion with three-byte codepage data.*/
|
|
{
|
|
|
|
/* MBCS with three byte codepage data test3.ucm*/
|
|
const UChar unicodeInput[] = { 0x20ac, 0x0005, 0x0006, 0xdbc4, 0xde34, 0xdbba, 0xdfcd, 0x000b, 0xd84d, 0xdc56, 0x000e, 0x0003, };
|
|
const uint8_t expectedtest3[] = { 0x00, 0x05, 0xff, 0x07, 0xff, 0x01, 0x02, 0x0b, 0x01, 0x02, 0x0a, 0xff, 0xff,};
|
|
int32_t totest3Offs[] = { 0, 1, 2, 3, 5, 7, 7, 7, 8, 8, 8, 10, 11};
|
|
|
|
const uint8_t test3input[] = { 0x00, 0x05, 0x06, 0x01, 0x02, 0x0b, 0x07, 0x01, 0x02, 0x0a,
|
|
0x01, 0x02, 0x0e, 0x01, 0x02, 0x0d, 0x03, 0x01, 0x02, 0x0f,};
|
|
const UChar expectedUnicode[] = { 0x20ac, 0x0005, 0x0006, 0x000b, 0xdbc4, 0xde34, 0xd84d, 0xdc56,
|
|
0x000e, 0xd891, 0xdd67, 0xfffd, 0xfffd };
|
|
int32_t fromtest3Offs[] = { 0, 1, 2, 3, 6, 6, 7, 7, 10, 13, 13, 16, 17};
|
|
|
|
/*from Unicode*/
|
|
if(!testConvertFromUnicode(unicodeInput, UPRV_LENGTHOF(unicodeInput),
|
|
expectedtest3, sizeof(expectedtest3), "@test3", TRUE, totest3Offs ))
|
|
log_err("u-> test3(MBCS conversion with three-byte) did not match.\n");
|
|
|
|
/*to Unicode*/
|
|
if(!testConvertToUnicode(test3input, sizeof(test3input),
|
|
expectedUnicode, UPRV_LENGTHOF(expectedUnicode), "@test3", TRUE, fromtest3Offs ))
|
|
log_err("test3(MBCS conversion with three-byte) -> u did not match.\n");
|
|
|
|
}
|
|
|
|
/*some more test to increase the code coverage in MBCS. Create an test converter from test4.ucm
|
|
which is test file for MBCS conversion with four-byte codepage data.*/
|
|
{
|
|
|
|
/* MBCS with three byte codepage data test4.ucm*/
|
|
const UChar unicodeInput[] =
|
|
{ 0x20ac, 0x0005, 0x0006, 0x000b, 0xdbc4, 0xde34, 0xdbba, 0xdfcd,
|
|
0xd84d, 0xdc56, 0x000e, 0xd891, 0xdd67, 0x000f};
|
|
const uint8_t expectedtest4[] =
|
|
{ 0x00, 0x05, 0xff, 0x01, 0x02, 0x03, 0x0b, 0x07, 0xff,
|
|
0x01, 0x02, 0x03, 0x0a, 0xff, 0xff, 0xff};
|
|
int32_t totest4Offs[] =
|
|
{ 0, 1, 2, 3, 3, 3, 3, 4, 6, 8, 8, 8, 8, 10, 11, 13};
|
|
|
|
const uint8_t test4input[] =
|
|
{ 0x00, 0x05, 0x06, 0x01, 0x02, 0x03, 0x0b, 0x07, 0x08,
|
|
0x01, 0x02, 0x03, 0x0a, 0x01, 0x02, 0x03, 0x0e, 0x01, 0x02, 0x03, 0x0d, 0x03, 0x01, 0x02, 0x03, 0x0c,};
|
|
const UChar expectedUnicode[] =
|
|
{ 0x20ac, 0x0005, 0x0006, 0x000b, 0xdbc4, 0xde34, 0xdbba, 0xdfcd,
|
|
0xd84d, 0xdc56, 0x000e, 0xd891, 0xdd67, 0x1a, 0xfffd};
|
|
int32_t fromtest4Offs[] =
|
|
{ 0, 1, 2, 3, 7, 7, 8, 8, 9, 9, 13, 17, 17, 21, 22,};
|
|
|
|
/*from Unicode*/
|
|
if(!testConvertFromUnicode(unicodeInput, UPRV_LENGTHOF(unicodeInput),
|
|
expectedtest4, sizeof(expectedtest4), "@test4", TRUE, totest4Offs ))
|
|
log_err("u-> test4(MBCS conversion with four-byte) did not match.\n");
|
|
|
|
/*to Unicode*/
|
|
if(!testConvertToUnicode(test4input, sizeof(test4input),
|
|
expectedUnicode, UPRV_LENGTHOF(expectedUnicode), "@test4", TRUE, fromtest4Offs ))
|
|
log_err("test4(MBCS conversion with four-byte) -> u did not match.\n");
|
|
|
|
}
|
|
/* Test for jitterbug 509 EBCDIC_STATEFUL Converters*/
|
|
{
|
|
const UChar unicodeInput[] = {0x00AF, 0x2013, 0x2223, 0x004C, 0x5F5D, 0xFF5E };
|
|
const uint8_t expectedtest1[] = {0x0E,0x42,0xA1, 0x44,0x4A, 0x42,0x4F, 0x0F,0xD3, 0x0E,0x65,0x60, 0x43,0xA1,0x0f };
|
|
int32_t totest1Offs[] = {0, 0, 0, 1, 1, 2, 2, 3, 3, 4, 4, 4, 5, 5, 5 };
|
|
const uint8_t test1input[] = {0x0E,0x42,0xA1, 0x44,0x4A, 0x42,0x4F, 0x0F,0xD3, 0x0E,0x65,0x60, 0x43,0xA1 };
|
|
const UChar expectedUnicode[] = {0x203e, 0x2014, 0xff5c, 0x004c, 0x5f5e, 0x223c };
|
|
int32_t fromtest1Offs[] = {1, 3, 5, 8, 10, 12 };
|
|
/*from Unicode*/
|
|
if(!testConvertFromUnicode(unicodeInput, UPRV_LENGTHOF(unicodeInput),
|
|
expectedtest1, sizeof(expectedtest1), "ibm-1371", TRUE, totest1Offs ))
|
|
log_err("u-> ibm-1371(MBCS conversion with single-byte) did not match.,\n");
|
|
/*to Unicode*/
|
|
if(!testConvertToUnicode(test1input, sizeof(test1input),
|
|
expectedUnicode, UPRV_LENGTHOF(expectedUnicode), "ibm-1371", TRUE, fromtest1Offs ))
|
|
log_err("ibm-1371(MBCS conversion with single-byte) -> u did not match.,\n");
|
|
}
|
|
|
|
}
|
|
#endif
|