/******************************************************************** * COPYRIGHT: * Copyright (c) 1997-2001, International Business Machines Corporation and * others. All Rights Reserved. ********************************************************************/ /******************************************************************************** * * File CU_CAPITST.C * * Modification History: * Name Description * Madhu Katragadda Ported for C API ********************************************************************************* */ #include #include "ccapitst.h" #include "unicode/uloc.h" #include "unicode/ucnv.h" #include "unicode/ucnv_err.h" #include "cintltst.h" #include "unicode/utypes.h" #include "unicode/ustring.h" #include "cstring.h" #include "cmemory.h" #define LENGTHOF(array) (sizeof(array)/sizeof((array)[0])) #define NUM_CODEPAGE 1 #define MAX_FILE_LEN 1024*20 #define UCS_FILE_NAME_SIZE 512 /*returns an action other than the one provided*/ static UConverterFromUCallback otherUnicodeAction(UConverterFromUCallback MIA); static UConverterToUCallback otherCharAction(UConverterToUCallback MIA); static void TestDuplicateAlias(void); static void TestCCSID(void); static void TestJ932(void); static void TestJ1968(void); static void TestConvertSafeCloneCallback(void); static void TestEBCDICSwapLFNL(void); void addTestConvert(TestNode** root); void addTestConvert(TestNode** root) { addTest(root, &TestConvert, "tsconv/ccapitst/TestConvert"); addTest(root, &TestAlias, "tsconv/ccapitst/TestAlias"); addTest(root, &TestDuplicateAlias, "tsconv/ccapitst/TestDuplicateAlias"); addTest(root, &TestConvertSafeClone, "tsconv/ccapitst/TestConvertSafeClone"); addTest(root, &TestConvertSafeCloneCallback, "tsconv/ccapitst/TestConvertSafeCloneCallback"); addTest(root, &TestCCSID, "tsconv/ccapitst/TestCCSID"); addTest(root, &TestJ932, "tsconv/ccapitst/TestJ932"); addTest(root, &TestJ1968, "tsconv/ccapitst/TestJ1968"); addTest(root, &TestEBCDICSwapLFNL, "tsconv/ccapitst/TestEBCDICSwapLFNL"); } static void TestConvert() { char myptr[4]; char save[4]; int32_t testLong1 = 0; uint16_t rest = 0; int32_t len = 0; int32_t x = 0; FILE* ucs_file_in = NULL; UChar BOM = 0x0000; UChar myUChar = 0x0000; char* mytarget; /* [MAX_FILE_LEN] */ char* mytarget_1; char* mytarget_use; UChar* consumedUni = NULL; char* consumed = NULL; char* output_cp_buffer; /* [MAX_FILE_LEN] */ UChar* ucs_file_buffer; /* [MAX_FILE_LEN] */ UChar* ucs_file_buffer_use; UChar* my_ucs_file_buffer; /* [MAX_FILE_LEN] */ UChar* my_ucs_file_buffer_1; int8_t ii = 0; int32_t j = 0; uint16_t codepage_index = 0; uint16_t count; int32_t cp = 0; UErrorCode err = U_ZERO_ERROR; const char* available_conv; char ucs_file_name[UCS_FILE_NAME_SIZE]; UConverterFromUCallback MIA1, MIA1_2; UConverterToUCallback MIA2, MIA2_2; const void *MIA1Context, *MIA1Context2, *MIA2Context, *MIA2Context2; UConverter* someConverters[5]; UConverter* myConverter = 0; UChar* displayname = 0; const char* locale; UChar* uchar1 = 0; UChar* uchar2 = 0; UChar* uchar3 = 0; int32_t targetcapacity2; int32_t targetcapacity; int32_t targetsize; int32_t disnamelen; const UChar* tmp_ucs_buf; const UChar* tmp_consumedUni=NULL; const char* tmp_mytarget_use; const char* tmp_consumed; int flushCount = 0; /****************************************************************** Checking Unicode -> ksc ******************************************************************/ const char* CodePagesToTest[NUM_CODEPAGE] = { "ibm-949_P110-2000" }; const uint16_t CodePageNumberToTest[NUM_CODEPAGE] = { 949 }; const int8_t CodePagesMinChars[NUM_CODEPAGE] = { 1 }; const int8_t CodePagesMaxChars[NUM_CODEPAGE] = { 2 }; const uint16_t CodePagesSubstitutionChars[NUM_CODEPAGE] = { 0xAFFE }; const char* CodePagesTestFiles[NUM_CODEPAGE] = { "uni-text.bin" }; const UConverterPlatform CodePagesPlatform[NUM_CODEPAGE] = { UCNV_IBM }; const char* CodePagesLocale[NUM_CODEPAGE] = { "ko_KR" }; UConverterFromUCallback oldFromUAction = NULL; UConverterToUCallback oldToUAction = NULL; const void* oldFromUContext = NULL; const void* oldToUContext = NULL; /* Allocate memory */ mytarget = (char*) malloc(MAX_FILE_LEN * sizeof(mytarget[0])); output_cp_buffer = (char*) malloc(MAX_FILE_LEN * sizeof(output_cp_buffer[0])); ucs_file_buffer = (UChar*) malloc(MAX_FILE_LEN * sizeof(ucs_file_buffer[0])); my_ucs_file_buffer = (UChar*) malloc(MAX_FILE_LEN * sizeof(my_ucs_file_buffer[0])); ucs_file_buffer_use = ucs_file_buffer; mytarget_1=mytarget; mytarget_use = mytarget; my_ucs_file_buffer_1=my_ucs_file_buffer; /* flush the converter cache to get a consistent state before the flushing is tested */ flushCount = ucnv_flushCache(); /*Calling all the UnicodeConverterCPP API and checking functionality*/ /*Tests ucnv_getAvailableName(), getAvialableCount()*/ log_verbose("Testing ucnv_countAvailable()..."); testLong1=ucnv_countAvailable(); log_info("Number of available Codepages: %d\n", testLong1); log_verbose("\n---Testing ucnv_getAvailableName.."); /*need to check this out */ available_conv = ucnv_getAvailableName(testLong1); /*test ucnv_getAvailableName with err condition*/ log_verbose("\n---Testing ucnv_getAvailableName..with index < 0 "); available_conv = ucnv_getAvailableName(-1); if(available_conv != NULL){ log_err("ucnv_getAvailableName() with index < 0) should return NULL\n"); } /* Test ucnv_countAliases() etc. */ count = ucnv_countAliases("utf-8", &err); if(U_FAILURE(err)) { log_err("FAILURE! ucnv_countAliases(\"utf-8\") -> %s\n", myErrorName(err)); } else if(count <= 0) { log_err("FAILURE! ucnv_countAliases(\"utf-8\") -> %d aliases\n", count); } else { /* try to get the aliases individually */ const char *alias; alias = ucnv_getAlias("utf-8", 0, &err); if(U_FAILURE(err)) { log_err("FAILURE! ucnv_getAlias(\"utf-8\", 0) -> %s\n", myErrorName(err)); } else if(uprv_strcmp("UTF-8", alias) != 0) { log_err("FAILURE! ucnv_getAlias(\"utf-8\", 0) -> %s instead of UTF-8\n", alias); } else { uint16_t aliasNum; for(aliasNum = 0; aliasNum < count; ++aliasNum) { alias = ucnv_getAlias("utf-8", aliasNum, &err); if(U_FAILURE(err)) { log_err("FAILURE! ucnv_getAlias(\"utf-8\", %d) -> %s\n", aliasNum, myErrorName(err)); } else if(uprv_strlen(alias) > 20) { /* sanity check */ log_err("FAILURE! ucnv_getAlias(\"utf-8\", %d) -> alias %s insanely long, corrupt?!\n", aliasNum, alias); } else { log_verbose("alias %d for utf-8: %s\n", aliasNum, alias); } } if(U_SUCCESS(err)) { /* try to fill an array with all aliases */ const char **aliases; aliases=(const char **)malloc(count * sizeof(const char *)); if(aliases != 0) { ucnv_getAliases("utf-8", aliases, &err); if(U_FAILURE(err)) { log_err("FAILURE! ucnv_getAliases(\"utf-8\") -> %s\n", myErrorName(err)); } else { for(aliasNum = 0; aliasNum < count; ++aliasNum) { /* compare the pointers with the ones returned individually */ alias = ucnv_getAlias("utf-8", aliasNum, &err); if(U_FAILURE(err)) { log_err("FAILURE! ucnv_getAlias(\"utf-8\", %d) -> %s\n", aliasNum, myErrorName(err)); } else if(aliases[aliasNum] != alias) { log_err("FAILURE! ucnv_getAliases(\"utf-8\")[%d] != ucnv_getAlias(\"utf-8\", %d)\n", aliasNum, aliasNum); } } } free((char **)aliases); } } } } /*Testing ucnv_openU()*/ { UChar converterName[]={ 0x0069, 0x0062, 0x006d, 0x002d, 0x0039, 0x0034, 0x0033, 0x0000}; /*ibm-943*/ UChar firstSortedName[]={ 0x0021, 0x0000}; /* ! */ UChar lastSortedName[]={ 0x007E, 0x0000}; /* ~ */ const char *illegalNameChars={ "ibm-943 ibm-943 ibm-943 ibm-943 ibm-943 ibm-943 ibm-943 ibm-943 ibm-943 ibm-943"}; UChar illegalName[100]; UConverter *converter=NULL; err=U_ZERO_ERROR; converter=ucnv_openU(converterName, &err); if(U_FAILURE(err)){ log_err("FAILURE! ucnv_openU(ibm-943, err) failed. %s\n", myErrorName(err)); } ucnv_close(converter); err=U_ZERO_ERROR; converter=ucnv_openU(NULL, &err); if(U_FAILURE(err)){ log_err("FAILURE! ucnv_openU(NULL, err) failed. %s\n", myErrorName(err)); } ucnv_close(converter); /*testing with error value*/ err=U_ILLEGAL_ARGUMENT_ERROR; converter=ucnv_openU(converterName, &err); if(!(converter == NULL)){ log_err("FAILURE! ucnv_openU(ibm-943, U_ILLEGAL_ARGUMENT_ERROR) is expected to fail\n"); } ucnv_close(converter); err=U_ZERO_ERROR; u_uastrcpy(illegalName, ""); u_uastrcpy(illegalName, illegalNameChars); ucnv_openU(illegalName, &err); if(!(err==U_ILLEGAL_ARGUMENT_ERROR)){ log_err("FAILURE! ucnv_openU(illegalName, err) is expected to fail\n"); } err=U_ZERO_ERROR; ucnv_openU(firstSortedName, &err); if(err!=U_FILE_ACCESS_ERROR){ log_err("FAILURE! ucnv_openU(firstSortedName, err) is expected to fail\n"); } err=U_ZERO_ERROR; ucnv_openU(lastSortedName, &err); if(err!=U_FILE_ACCESS_ERROR){ log_err("FAILURE! ucnv_openU(lastSortedName, err) is expected to fail\n"); } err=U_ZERO_ERROR; } log_verbose("Testing ucnv_open() with converter name greater than 7 characters\n"); { UConverter *cnv=NULL; err=U_ZERO_ERROR; cnv=ucnv_open("ibm-949,Madhu", &err); if(U_FAILURE(err)){ log_err("FAILURE! ucnv_open(\"ibm-949,Madhu\", err) failed. %s\n", myErrorName(err)); } ucnv_close(cnv); } /*Testing ucnv_convert()*/ { int32_t targetLimit=0, sourceLimit=0, i=0, targetCapacity=0; const uint8_t source[]={ 0x00, 0x04, 0x05, 0x06, 0xa2, 0xb4, 0x00}; const uint8_t expectedTarget[]={ 0x00, 0x37, 0x2d, 0x2e, 0x0e, 0x49, 0x62, 0x0f, 0x00}; char *target=0; sourceLimit=sizeof(source)/sizeof(source[0]); err=U_ZERO_ERROR; targetLimit=0; targetCapacity=ucnv_convert("ibm-1364", "ibm-1363", NULL, targetLimit , (const char*)source, sourceLimit, &err); if(err == U_BUFFER_OVERFLOW_ERROR){ err=U_ZERO_ERROR; targetLimit=targetCapacity+1; target=(char*)malloc(sizeof(char) * targetLimit); targetCapacity=ucnv_convert("ibm-1364", "ibm-1363", target, targetLimit , (const char*)source, sourceLimit, &err); } if(U_FAILURE(err)){ log_err("FAILURE! ucnv_convert(ibm-1363->ibm-1364) failed. %s\n", myErrorName(err)); } else { for(i=0; iibm-1364) failed.at index \n i=%d, Expected: %lx Got: %lx\n", i, (UChar)expectedTarget[i], (uint8_t)target[i]); } } /*Test error conditions*/ i=ucnv_convert("ibm-1364", "ibm-1363", target, targetLimit , (const char*)source, 0, &err); if(i !=0){ log_err("FAILURE! ucnv_convert() with sourceLimit=0 is expected to return 0\n"); } ucnv_convert("ibm-1364", "ibm-1363", target, targetLimit , (const char*)source, -1, &err); if(!(U_FAILURE(err) && err==U_ILLEGAL_ARGUMENT_ERROR)){ log_err("FAILURE! ucnv_convert() with sourceLimit=-1 is expected to fail\n"); } sourceLimit=sizeof(source)/sizeof(source[0]); i=ucnv_convert("ibm-1364", "ibm-1363", target, targetLimit , (const char*)source, sourceLimit, &err); if(i !=0 ){ log_err("FAILURE! ucnv_convert() with err=U_ILLEGAL_ARGUMENT_ERROR is expected to return 0\n"); } err=U_ZERO_ERROR; sourceLimit=sizeof(source)/sizeof(source[0]); targetLimit=0; i=ucnv_convert("ibm-1364", "ibm-1363", target, targetLimit , (const char*)source, sourceLimit, &err); if(!(U_FAILURE(err) && err==U_BUFFER_OVERFLOW_ERROR)){ log_err("FAILURE! ucnv_convert() with targetLimit=0 is expected to throw U_BUFFER_OVERFLOW_ERROR\n"); } err=U_ZERO_ERROR; free(target); ucnv_flushCache(); } } /*Testing ucnv_open()*/ /* Note: These converters have been chosen because they do NOT encode the Latin characters (U+0041, ...), and therefore are highly unlikely to be chosen as system default codepages */ someConverters[0] = ucnv_open("ibm-1047", &err); if (U_FAILURE(err)) { log_err("FAILURE! %s\n", myErrorName(err)); } someConverters[1] = ucnv_open("ibm-1047", &err); if (U_FAILURE(err)) { log_err("FAILURE! %s\n", myErrorName(err)); } someConverters[2] = ucnv_open("ibm-1047", &err); if (U_FAILURE(err)) { log_err("FAILURE! %s\n", myErrorName(err)); } someConverters[3] = ucnv_open("gb18030", &err); if (U_FAILURE(err)) { log_err("FAILURE! %s\n", myErrorName(err)); } someConverters[4] = ucnv_open("ibm-949", &err); if (U_FAILURE(err)) { log_err("FAILURE! %s\n", myErrorName(err)); } /* Testing ucnv_flushCache() */ log_verbose("\n---Testing ucnv_flushCache...\n"); if ((flushCount=ucnv_flushCache())==0) log_verbose("Flush cache ok\n"); else log_err("Flush Cache failed [line %d], expect 0 got %d \n", __LINE__, flushCount); /*testing ucnv_close() and ucnv_flushCache() */ ucnv_close(someConverters[0]); ucnv_close(someConverters[1]); ucnv_close(someConverters[2]); ucnv_close(someConverters[3]); if ((flushCount=ucnv_flushCache())==2) log_verbose("Flush cache ok\n"); /*because first, second and third are same */ else log_err("Flush Cache failed line %d, got %d expected 2 or there is an error in ucnv_close()\n", __LINE__, flushCount); ucnv_close(someConverters[4]); if ( (flushCount=ucnv_flushCache())==1) log_verbose("Flush cache ok\n"); else log_err("Flush Cache failed line %d, expected 1 got %d \n", __LINE__, flushCount); /*Testing ucnv_openCCSID and ucnv_open with error conditions*/ log_verbose("\n---Testing ucnv_open with err ! = U_ZERO_ERROR...\n"); err=U_ILLEGAL_ARGUMENT_ERROR; if(ucnv_open(NULL, &err) != NULL){ log_err("ucnv_open with err != U_ZERO_ERROR is supposed to fail\n"); } if(ucnv_openCCSID(1051, UCNV_IBM, &err) != NULL){ log_err("ucnv_open with err != U_ZERO_ERROR is supposed to fail\n"); } err=U_ZERO_ERROR; /* Testing ucnv_openCCSID(), ucnv_open(), ucnv_getName() */ log_verbose("\n---Testing ucnv_open default...\n"); someConverters[0] = ucnv_open(NULL,&err); someConverters[1] = ucnv_open(NULL,&err); someConverters[2] = ucnv_open("utf8", &err); someConverters[3] = ucnv_openCCSID(949,UCNV_IBM,&err); ucnv_close(ucnv_openCCSID(1051, UCNV_IBM, &err)); /* test for j350; ucnv_close(NULL) is safe */ if (U_FAILURE(err)){ log_err("FAILURE! %s\n", myErrorName(err));} /* Testing ucnv_getName()*/ /*default code page */ ucnv_getName(someConverters[0], &err); if(U_FAILURE(err)) { log_err("getName[0] failed\n"); } else { log_verbose("getName(someConverters[0]) returned %s\n", ucnv_getName(someConverters[0], &err)); } ucnv_getName(someConverters[1], &err); if(U_FAILURE(err)) { log_err("getName[1] failed\n"); } else { log_verbose("getName(someConverters[1]) returned %s\n", ucnv_getName(someConverters[1], &err)); } /*Testing ucnv_getDefaultName() and ucnv_setDefaultNAme()*/ { const char* defaultName=ucnv_getDefaultName(); log_verbose("getDefaultName returned %s\n", defaultName); /*change the default name by setting it */ ucnv_setDefaultName("changed"); if(strcmp(ucnv_getDefaultName(), "changed")==0) log_verbose("setDefaultName o.k"); else log_err("setDefaultName failed"); /*set the default name back*/ ucnv_setDefaultName(defaultName); } ucnv_close(someConverters[0]); ucnv_close(someConverters[1]); ucnv_close(someConverters[2]); ucnv_close(someConverters[3]); for (codepage_index=0; codepage_index < NUM_CODEPAGE; ++codepage_index) { int32_t i = 0; char* index = NULL; strcpy(ucs_file_name, loadTestData(&err)); if(U_FAILURE(err)){ log_err("Couldn't get the test data directory... Exiting...Error:%s\n", u_errorName(err)); return; } index=strrchr(ucs_file_name,(char)U_FILE_SEP_CHAR); if((unsigned int)(index-ucs_file_name) != (strlen(ucs_file_name)-1)){ *(index+1)=0; } strcat(ucs_file_name,".."U_FILE_SEP_STRING); strcat(ucs_file_name, CodePagesTestFiles[codepage_index]); ucs_file_in = fopen(ucs_file_name,"rb"); if (!ucs_file_in) { log_err("Couldn't open the Unicode file [%s]... Exiting...\n", ucs_file_name); return; } /*Creates a converter and testing ucnv_openCCSID(u_int code_page, platform, errstatus*/ /* myConverter =ucnv_openCCSID(CodePageNumberToTest[codepage_index],UCNV_IBM, &err); */ /* ucnv_flushCache(); */ myConverter =ucnv_open( "ibm-949", &err); if (!myConverter || U_FAILURE(err)) { log_err("Error creating the convertor \n"); return; } /*testing for ucnv_getName() */ log_verbose("Testing ucnv_getName()...\n"); ucnv_getName(myConverter, &err); if(U_FAILURE(err)) log_err("Error in getName\n"); else { log_verbose("getName o.k. %s\n", ucnv_getName(myConverter, &err)); } if (uprv_stricmp(ucnv_getName(myConverter, &err), CodePagesToTest[codepage_index])) log_err("getName failed\n"); else log_verbose("getName ok\n"); /*Test getName with error condition*/ { const char* name=0; err=U_ILLEGAL_ARGUMENT_ERROR; log_verbose("Testing ucnv_getName with err != U_ZERO_ERROR"); name=ucnv_getName(myConverter, &err); if(name != NULL){ log_err("ucnv_getName() with err != U_ZERO_ERROR is expected to fail"); } err=U_ZERO_ERROR; } /*Tests ucnv_getMaxCharSize() and ucnv_getMinCharSize()*/ log_verbose("Testing ucnv_getMaxCharSize()...\n"); if (ucnv_getMaxCharSize(myConverter)==CodePagesMaxChars[codepage_index]) log_verbose("Max byte per character OK\n"); else log_err("Max byte per character failed\n"); log_verbose("\n---Testing ucnv_getMinCharSize()...\n"); if (ucnv_getMinCharSize(myConverter)==CodePagesMinChars[codepage_index]) log_verbose("Min byte per character OK\n"); else log_err("Min byte per character failed\n"); /*Testing for ucnv_getSubstChars() and ucnv_setSubstChars()*/ log_verbose("\n---Testing ucnv_getSubstChars...\n"); ii=4; ucnv_getSubstChars(myConverter, myptr, &ii, &err); for(x=0;x> 8) | (myUChar << 8))); /*adjust if BIG_ENDIAN*/ } myUChar = ucs_file_buffer[i-1]; ucs_file_buffer[i-1] = (UChar)((BOM==0xFEFF)?myUChar:((myUChar >> 8) | (myUChar << 8))); /*adjust if BIG_ENDIAN Corner Case*/ /*testing ucnv_fromUChars() and ucnv_toUChars() */ /*uchar1---fromUChar--->output_cp_buffer --toUChar--->uchar2*/ uchar1=(UChar*)malloc(sizeof(UChar) * (i+1)); u_uastrcpy(uchar1,""); u_strncpy(uchar1,ucs_file_buffer,i); uchar1[i] = 0; uchar3=(UChar*)malloc(sizeof(UChar)*(i+1)); u_uastrcpy(uchar3,""); u_strncpy(uchar3,ucs_file_buffer,i); uchar3[i] = 0; /*Calls the Conversion Routine */ testLong1 = MAX_FILE_LEN; log_verbose("\n---Testing ucnv_fromUChars()\n"); targetcapacity = ucnv_fromUChars(myConverter, output_cp_buffer, testLong1, uchar1, -1, &err); if (U_FAILURE(err)) { log_err("\nFAILURE...%s\n", myErrorName(err)); } else log_verbose(" ucnv_fromUChars() o.k.\n"); /*test the conversion routine */ log_verbose("\n---Testing ucnv_toUChars()\n"); /*call it first time for trapping the targetcapacity and size needed to allocate memory for the buffer uchar2 */ targetcapacity2=0; targetsize = ucnv_toUChars(myConverter, NULL, targetcapacity2, output_cp_buffer, strlen(output_cp_buffer), &err); /*if there is an buffer overflow then trap the values and pass them and make the actual call*/ if(err==U_BUFFER_OVERFLOW_ERROR) { err=U_ZERO_ERROR; uchar2=(UChar*)malloc((targetsize+1) * sizeof(UChar)); targetsize = ucnv_toUChars(myConverter, uchar2, targetsize+1, output_cp_buffer, strlen(output_cp_buffer), &err); if(U_FAILURE(err)) log_err("ucnv_toUChars() FAILED %s\n", myErrorName(err)); else log_verbose(" ucnv_toUChars() o.k.\n"); if(u_strcmp(uchar1,uchar2)!=0) log_err("equality test failed with conversion routine\n"); } else { log_err("ERR: calling toUChars: Didn't get U_BUFFER_OVERFLOW .. expected it.\n"); } /*Testing ucnv_fromUChars and ucnv_toUChars with error conditions*/ err=U_ILLEGAL_ARGUMENT_ERROR; log_verbose("\n---Testing ucnv_fromUChars() with err != U_ZERO_ERROR\n"); targetcapacity = ucnv_fromUChars(myConverter, output_cp_buffer, testLong1, uchar1, -1, &err); if (targetcapacity !=0) { log_err("\nFAILURE: ucnv_fromUChars with err != U_ZERO_ERROR is expected to fail and return 0\n"); } err=U_ZERO_ERROR; log_verbose("\n---Testing ucnv_fromUChars() with converter=NULL\n"); targetcapacity = ucnv_fromUChars(NULL, output_cp_buffer, testLong1, uchar1, -1, &err); if (targetcapacity !=0 || err != U_ILLEGAL_ARGUMENT_ERROR) { log_err("\nFAILURE: ucnv_fromUChars with converter=NULL is expected to fail\n"); } err=U_ZERO_ERROR; log_verbose("\n---Testing ucnv_fromUChars() with sourceLength = 0\n"); targetcapacity = ucnv_fromUChars(myConverter, output_cp_buffer, testLong1, uchar1, 0, &err); if (targetcapacity !=0) { log_err("\nFAILURE: ucnv_fromUChars with sourceLength 0 is expected to return 0\n"); } log_verbose("\n---Testing ucnv_fromUChars() with targetLength = 0\n"); targetcapacity = ucnv_fromUChars(myConverter, output_cp_buffer, 0, uchar1, -1, &err); if (err != U_BUFFER_OVERFLOW_ERROR) { log_err("\nFAILURE: ucnv_fromUChars with targetLength 0 is expected to fail and throw U_BUFFER_OVERFLOW_ERROR\n"); } /*toUChars with error conditions*/ targetsize = ucnv_toUChars(myConverter, uchar2, targetsize, output_cp_buffer, strlen(output_cp_buffer), &err); if(targetsize != 0){ log_err("\nFAILURE: ucnv_toUChars with err != U_ZERO_ERROR is expected to fail and return 0\n"); } err=U_ZERO_ERROR; targetsize = ucnv_toUChars(myConverter, uchar2, -1, output_cp_buffer, strlen(output_cp_buffer), &err); if(targetsize != 0 || err != U_ILLEGAL_ARGUMENT_ERROR){ log_err("\nFAILURE: ucnv_toUChars with targetsize < 0 is expected to throw U_ILLEGAL_ARGUMENT_ERROR and return 0\n"); } err=U_ZERO_ERROR; targetsize = ucnv_toUChars(myConverter, uchar2, 0, output_cp_buffer, 0, &err); if (targetsize !=0) { log_err("\nFAILURE: ucnv_toUChars with sourceLength 0 is expected to return 0\n"); } targetcapacity2=0; targetsize = ucnv_toUChars(myConverter, NULL, targetcapacity2, output_cp_buffer, strlen(output_cp_buffer), &err); if (err != U_STRING_NOT_TERMINATED_WARNING) { log_err("\nFAILURE: ucnv_toUChars(targetLength)->%s instead of U_STRING_NOT_TERMINATED_WARNING\n", u_errorName(err)); } err=U_ZERO_ERROR; /*-----*/ /*testing for ucnv_fromUnicode() and ucnv_toUnicode() */ /*Clean up re-usable vars*/ j=0; log_verbose("Testing ucnv_fromUnicode().....\n"); tmp_ucs_buf=ucs_file_buffer_use; ucnv_fromUnicode(myConverter, &mytarget_1, mytarget + MAX_FILE_LEN, &tmp_ucs_buf, ucs_file_buffer_use+i, NULL, TRUE, &err); consumedUni = (UChar*)tmp_consumedUni; if (U_FAILURE(err)) { log_err("FAILURE! %s\n", myErrorName(err)); } else log_verbose("ucnv_fromUnicode() o.k.\n"); /*Uni1 ----ToUnicode----> Cp2 ----FromUnicode---->Uni3 */ log_verbose("Testing ucnv_toUnicode().....\n"); tmp_mytarget_use=mytarget_use; tmp_consumed = consumed; ucnv_toUnicode(myConverter, &my_ucs_file_buffer_1, my_ucs_file_buffer + MAX_FILE_LEN, &tmp_mytarget_use, mytarget_use + (mytarget_1 - mytarget), NULL, FALSE, &err); consumed = (char*)tmp_consumed; if (U_FAILURE(err)) { log_err("FAILURE! %s\n", myErrorName(err)); } else log_verbose("ucnv_toUnicode() o.k.\n"); log_verbose("\n---Testing RoundTrip ...\n"); u_strncpy(uchar3, my_ucs_file_buffer,i); uchar3[i] = 0; if(u_strcmp(uchar1,uchar3)==0) log_verbose("Equality test o.k.\n"); else log_err("Equality test failed\n"); /*sanity compare */ if(uchar2 == NULL) { log_err("uchar2 was NULL (ccapitst.c line %d), couldn't do sanity check\n", __LINE__); } else { if(u_strcmp(uchar2, uchar3)==0) log_verbose("Equality test o.k.\n"); else log_err("Equality test failed\n"); } fclose(ucs_file_in); ucnv_close(myConverter); free(displayname); if (uchar1 != 0) free(uchar1); if (uchar2 != 0) free(uchar2); if (uchar3 != 0) free(uchar3); } free((void*)mytarget); free((void*)output_cp_buffer); free((void*)ucs_file_buffer); free((void*)my_ucs_file_buffer); } static UConverterFromUCallback otherUnicodeAction(UConverterFromUCallback MIA) { return (MIA==(UConverterFromUCallback)UCNV_FROM_U_CALLBACK_STOP)?(UConverterFromUCallback)UCNV_FROM_U_CALLBACK_SUBSTITUTE:(UConverterFromUCallback)UCNV_FROM_U_CALLBACK_STOP; } static UConverterToUCallback otherCharAction(UConverterToUCallback MIA) { return (MIA==(UConverterToUCallback)UCNV_TO_U_CALLBACK_STOP)?(UConverterToUCallback)UCNV_TO_U_CALLBACK_SUBSTITUTE:(UConverterToUCallback)UCNV_TO_U_CALLBACK_STOP; } /** * Test the converter alias API, specifically the fuzzy matching of * alias names and the alias table integrity. Make sure each * converter has at least one alias (itself), and that its listed * aliases map back to itself. Check some hard-coded UTF-8 and * ISO_2022 aliases to make sure they work. */ static void TestAlias() { int32_t i, ncnv; UErrorCode status = U_ZERO_ERROR; /* Predetermined aliases that we expect to map back to ISO_2022 * and UTF-8. UPDATE THIS DATA AS NECESSARY. */ const char* ISO_2022_NAMES[] = {"ISO_2022", "iso-2022", "2022", "cp2022", "iso2022", "iso_2022"}; int32_t ISO_2022_NAMES_LENGTH = sizeof(ISO_2022_NAMES) / sizeof(ISO_2022_NAMES[0]); const char *UTF8_NAMES[] = { "UTF-8", "utf-8", "utf8", "ibm-1208", "utf_8", "ibm1208", "cp1208" }; int32_t UTF8_NAMES_LENGTH = sizeof(UTF8_NAMES) / sizeof(UTF8_NAMES[0]); struct { const char *name; const char *alias; } CONVERTERS_NAMES[] = { { "UTF-32BE", "UTF32_BigEndian" }, { "UTF-32LE", "UTF32_LittleEndian" }, { "UTF-32", "ISO-10646-UCS-4" }, { "UTF32_PlatformEndian", "UTF32_PlatformEndian" }, { "UTF-32", "ucs-4" } }; int32_t CONVERTERS_NAMES_LENGTH = sizeof(CONVERTERS_NAMES) / sizeof(*CONVERTERS_NAMES); /* When there are bugs in gencnval or in ucnv_io, converters can appear to have no aliases. */ ncnv = ucnv_countAvailable(); log_verbose("%d converters\n", ncnv); for (i=0; i " "alias[%d]=NULL\n", name, j); continue; } mapBack = ucnv_getAlias(alias, 0, &status); if (mapBack == NULL) { log_err("FAIL: Converter \"%s\" -> " "alias[%d]=\"%s\" -> " "alias[0]=NULL, exp. \"%s\"\n", name, j, alias, alias0); continue; } if (0 != uprv_strcmp(alias0, mapBack)) { int32_t idx; UBool foundAlias = FALSE; if (status == U_AMBIGUOUS_ALIAS_WARNING) { /* Make sure that we only get this mismapping when there is an ambiguous alias, and the other converter has this alias too. */ for (idx = 0; idx < ucnv_countAliases(mapBack, &status); idx++) { if (uprv_strcmp(ucnv_getAlias(mapBack, (uint16_t)idx, &status), alias) == 0) { foundAlias = TRUE; break; } } } /* else not ambiguous, and this is a real problem. foundAlias = FALSE */ if (!foundAlias) { log_err("FAIL: Converter \"%s\" -> " "alias[%d]=\"%s\" -> " "alias[0]=\"%s\", exp. \"%s\"\n", name, j, alias, mapBack, alias0); } } } } /* Check a list of predetermined aliases that we expect to map * back to ISO_2022 and UTF-8. */ for (i=1; i \"%s\", expect ISO_2022\n", ISO_2022_NAMES[i], mapBack); } } for (i=1; i \"%s\", expect UTF-8\n", UTF8_NAMES[i], mapBack); } } /* * Check a list of predetermined aliases that we expect to map * back to predermined converter names. */ for (i = 0; i < CONVERTERS_NAMES_LENGTH; ++i) { const char* mapBack = ucnv_getAlias(CONVERTERS_NAMES[i].alias, 0, &status); if (0 != uprv_strcmp(mapBack, CONVERTERS_NAMES[i].name)) { log_err("FAIL: \"%s\" -> \"%s\", expect %s\n", CONVERTERS_NAMES[i].alias, mapBack, CONVERTERS_NAMES[i].name); } } } static void TestDuplicateAlias(void) { const char *alias; UErrorCode status = U_ZERO_ERROR; status = U_ZERO_ERROR; alias = ucnv_getStandardName("Shift_JIS", "IBM", &status); if (alias == NULL || uprv_strcmp(alias, "ibm-943") != 0 || status != U_AMBIGUOUS_ALIAS_WARNING) { log_err("FAIL: Didn't get ibm-943 for Shift_JIS {IBM}. Got %s\n", alias); } status = U_ZERO_ERROR; alias = ucnv_getStandardName("ibm-943", "IANA", &status); if (alias == NULL || uprv_strcmp(alias, "Shift_JIS") != 0 || status != U_AMBIGUOUS_ALIAS_WARNING) { log_err("FAIL: Didn't get Shift_JIS for ibm-943 {IANA}. Got %s\n", alias); } status = U_ZERO_ERROR; alias = ucnv_getStandardName("ibm-943_P130-2000", "IANA", &status); if (alias != NULL || status == U_AMBIGUOUS_ALIAS_WARNING) { log_err("FAIL: Didn't get NULL for ibm-943 {IANA}. Got %s\n", alias); } } /* Test safe clone callback */ static uint32_t TSCC_nextSerial() { static uint32_t n = 1; return (n++); } typedef struct { uint32_t magic; /* 0xC0FFEE to identify that the object is OK */ uint32_t serial; /* minted from nextSerial, above */ UBool wasClosed; /* close happened on the object */ } TSCCContext; static TSCCContext *TSCC_clone(TSCCContext *ctx) { TSCCContext *newCtx; newCtx = malloc(sizeof(TSCCContext)); newCtx->serial = TSCC_nextSerial(); newCtx->wasClosed = 0; newCtx->magic = 0xC0FFEE; log_verbose("TSCC_clone: %p:%d -> new context %p:%d\n", ctx, ctx->serial, newCtx, newCtx->serial); return newCtx; } static void TSCC_fromU(const void *context, UConverterFromUnicodeArgs *fromUArgs, const UChar* codeUnits, int32_t length, UChar32 codePoint, UConverterCallbackReason reason, UErrorCode * err) { TSCCContext *ctx = (TSCCContext*)context; UConverterFromUCallback junkFrom; log_verbose("TSCC_fromU: Context %p:%d called, reason %d on cnv %p\n", ctx, ctx->serial, reason, fromUArgs->converter); if(ctx->magic != 0xC0FFEE) { log_err("TSCC_fromU: Context %p:%d magic is 0x%x should be 0xC0FFEE.\n", ctx,ctx->serial, ctx->magic); return; } if(reason == UCNV_CLONE) { UErrorCode subErr = U_ZERO_ERROR; TSCCContext *newCtx; TSCCContext *junkCtx; /* "recreate" it */ log_verbose("TSCC_fromU: cloning..\n"); newCtx = TSCC_clone(ctx); if(newCtx == NULL) { log_err("TSCC_fromU: internal clone failed on %p\n", ctx); } /* now, SET it */ ucnv_getFromUCallBack(fromUArgs->converter, &junkFrom, (const void**)&junkCtx); ucnv_setFromUCallBack(fromUArgs->converter, junkFrom, newCtx, NULL, NULL, &subErr); if(U_FAILURE(subErr)) { *err = subErr; } } if(reason == UCNV_CLOSE) { log_verbose("TSCC_fromU: Context %p:%d closing\n", ctx, ctx->serial); ctx->wasClosed = TRUE; } } static void TSCC_toU(const void *context, UConverterToUnicodeArgs *toUArgs, const char* codeUnits, int32_t length, UConverterCallbackReason reason, UErrorCode * err) { TSCCContext *ctx = (TSCCContext*)context; UConverterToUCallback junkFrom; log_verbose("TSCC_toU: Context %p:%d called, reason %d on cnv %p\n", ctx, ctx->serial, reason, toUArgs->converter); if(ctx->magic != 0xC0FFEE) { log_err("TSCC_toU: Context %p:%d magic is 0x%x should be 0xC0FFEE.\n", ctx,ctx->serial, ctx->magic); return; } if(reason == UCNV_CLONE) { UErrorCode subErr = U_ZERO_ERROR; TSCCContext *newCtx; TSCCContext *junkCtx; /* "recreate" it */ log_verbose("TSCC_toU: cloning..\n"); newCtx = TSCC_clone(ctx); if(newCtx == NULL) { log_err("TSCC_toU: internal clone failed on %p\n", ctx); } /* now, SET it */ ucnv_getToUCallBack(toUArgs->converter, &junkFrom, (const void**)&junkCtx); ucnv_setToUCallBack(toUArgs->converter, junkFrom, newCtx, NULL, NULL, &subErr); if(U_FAILURE(subErr)) { *err = subErr; } } if(reason == UCNV_CLOSE) { log_verbose("TSCC_toU: Context %p:%d closing\n", ctx, ctx->serial); ctx->wasClosed = TRUE; } } static void TSCC_init(TSCCContext *q) { q->magic = 0xC0FFEE; q->serial = TSCC_nextSerial(); q->wasClosed = 0; } static void TSCC_print_log(TSCCContext *q, const char *name) { if(q==NULL) { log_verbose("TSCContext: %s is NULL!!\n", name); } else { if(q->magic != 0xC0FFEE) { log_err("TSCCContext: %p:%d's magic is %x, supposed to be 0xC0FFEE\n", q,q->serial, q->magic); } log_verbose("TSCCContext %p:%d=%s - magic %x, %s\n", q, q->serial, name, q->magic, q->wasClosed?"CLOSED":"open"); } } static void TestConvertSafeCloneCallback() { UErrorCode err = U_ZERO_ERROR; TSCCContext from1, to1; TSCCContext *from2, *from3, *to2, *to3; char hunk[8192]; int32_t hunkSize = 8192; UConverterFromUCallback junkFrom; UConverterToUCallback junkTo; UConverter *conv1, *conv2 = NULL; conv1 = ucnv_open("iso-8859-3", &err); if(U_FAILURE(err)) { log_err("Err opening iso-8859-3, %s", u_errorName(err)); return; } log_verbose("Opened conv1=%p\n", conv1); TSCC_init(&from1); TSCC_init(&to1); TSCC_print_log(&from1, "from1"); TSCC_print_log(&to1, "to1"); ucnv_setFromUCallBack(conv1, TSCC_fromU, &from1, NULL, NULL, &err); log_verbose("Set from1 on conv1\n"); TSCC_print_log(&from1, "from1"); ucnv_setToUCallBack(conv1, TSCC_toU, &to1, NULL, NULL, &err); log_verbose("Set to1 on conv1\n"); TSCC_print_log(&to1, "to1"); conv2 = ucnv_safeClone(conv1, hunk, &hunkSize, &err); if(U_FAILURE(err)) { log_err("safeClone failed: %s\n", u_errorName(err)); return; } log_verbose("Cloned to conv2=%p.\n", conv2); /********** from *********************/ ucnv_getFromUCallBack(conv2, &junkFrom, (const void**)&from2); ucnv_getFromUCallBack(conv1, &junkFrom, (const void**)&from3); TSCC_print_log(from2, "from2"); TSCC_print_log(from3, "from3(==from1)"); if(from2 == NULL) { log_err("FAIL! from2 is null \n"); return; } if(from3 == NULL) { log_err("FAIL! from3 is null \n"); return; } if(from3 != (&from1) ) { log_err("FAIL! conv1's FROM context changed!\n"); } if(from2 == (&from1) ) { log_err("FAIL! conv1's FROM context is the same as conv2's!\n"); } if(from1.wasClosed) { log_err("FAIL! from1 is closed \n"); } if(from2->wasClosed) { log_err("FAIL! from2 was closed\n"); } /********** to *********************/ ucnv_getToUCallBack(conv2, &junkTo, (const void**)&to2); ucnv_getToUCallBack(conv1, &junkTo, (const void**)&to3); TSCC_print_log(to2, "to2"); TSCC_print_log(to3, "to3(==to1)"); if(to2 == NULL) { log_err("FAIL! to2 is null \n"); return; } if(to3 == NULL) { log_err("FAIL! to3 is null \n"); return; } if(to3 != (&to1) ) { log_err("FAIL! conv1's TO context changed!\n"); } if(to2 == (&to1) ) { log_err("FAIL! conv1's TO context is the same as conv2's!\n"); } if(to1.wasClosed) { log_err("FAIL! to1 is closed \n"); } if(to2->wasClosed) { log_err("FAIL! to2 was closed\n"); } /*************************************/ ucnv_close(conv1); log_verbose("ucnv_closed (conv1)\n"); TSCC_print_log(&from1, "from1"); TSCC_print_log(from2, "from2"); TSCC_print_log(&to1, "to1"); TSCC_print_log(to2, "to2"); if(from1.wasClosed == FALSE) { log_err("FAIL! from1 is NOT closed \n"); } if(from2->wasClosed) { log_err("FAIL! from2 was closed\n"); } if(to1.wasClosed == FALSE) { log_err("FAIL! to1 is NOT closed \n"); } if(to2->wasClosed) { log_err("FAIL! to2 was closed\n"); } ucnv_close(conv2); log_verbose("ucnv_closed (conv2)\n"); TSCC_print_log(&from1, "from1"); TSCC_print_log(from2, "from2"); if(from1.wasClosed == FALSE) { log_err("FAIL! from1 is NOT closed \n"); } if(from2->wasClosed == FALSE) { log_err("FAIL! from2 was NOT closed\n"); } TSCC_print_log(&to1, "to1"); TSCC_print_log(to2, "to2"); if(to1.wasClosed == FALSE) { log_err("FAIL! to1 is NOT closed \n"); } if(to2->wasClosed == FALSE) { log_err("FAIL! to2 was NOT closed\n"); } if(to2 != (&to1)) { free(to2); /* to1 is stack based */ } if(from2 != (&from1)) { free(from2); /* from1 is stack based */ } } static void TestConvertSafeClone() { #define CLONETEST_CONVERTER_COUNT 9 char charBuffer [21]; /* Leave at an odd number for alignment testing */ uint8_t buffer [CLONETEST_CONVERTER_COUNT] [U_CNV_SAFECLONE_BUFFERSIZE]; int32_t bufferSize = U_CNV_SAFECLONE_BUFFERSIZE; UConverter * someConverters [CLONETEST_CONVERTER_COUNT]; UConverter * someClonedConverters [CLONETEST_CONVERTER_COUNT]; UConverter * cnv; UErrorCode err = U_ZERO_ERROR; char *pCharBuffer; const char *pConstCharBuffer; const char *charBufferLimit = charBuffer + sizeof(charBuffer)/sizeof(*charBuffer); UChar uniBuffer [] = {0x0058, 0x0059, 0x005A}; /* "XYZ" */ UChar uniCharBuffer [20]; char charSourceBuffer [] = { 0x1b, 0x24, 0x42 }; const char *pCharSource = charSourceBuffer; const char *pCharSourceLimit = charSourceBuffer + sizeof(charSourceBuffer); UChar *pUCharTarget = uniCharBuffer; UChar *pUCharTargetLimit = uniCharBuffer + sizeof(uniCharBuffer)/sizeof(*uniCharBuffer); const UChar * pUniBuffer; const UChar *uniBufferLimit = uniBuffer + sizeof(uniBuffer)/sizeof(*uniBuffer); int index; /* one 'regular' & all the 'private stateful' converters */ someConverters[0] = ucnv_open("ibm-1047", &err); someConverters[1] = ucnv_open("ISO_2022", &err); someConverters[2] = ucnv_open("SCSU", &err); someConverters[3] = ucnv_open("HZ", &err); someConverters[4] = ucnv_open("lmbcs", &err); someConverters[5] = ucnv_open("ISCII,version=0",&err); someConverters[6] = ucnv_open("ISO_2022,locale=kr,version=1",&err); someConverters[7] = ucnv_open("ISO_2022,locale=jp,version=1",&err); someConverters[8] = ucnv_open("BOCU-1", &err); /* Check the various error & informational states: */ /* Null status - just returns NULL */ if (0 != ucnv_safeClone(someConverters[0], buffer[0], &bufferSize, 0)) { log_err("FAIL: Cloned converter failed to deal correctly with null status\n"); } /* error status - should return 0 & keep error the same */ err = U_MEMORY_ALLOCATION_ERROR; if (0 != ucnv_safeClone(someConverters[0], buffer[0], &bufferSize, &err) || err != U_MEMORY_ALLOCATION_ERROR) { log_err("FAIL: Cloned converter failed to deal correctly with incoming error status\n"); } err = U_ZERO_ERROR; /* Null buffer size pointer - just returns NULL & set error to U_ILLEGAL_ARGUMENT_ERROR*/ if (0 != ucnv_safeClone(someConverters[0], buffer[0], 0, &err) || err != U_ILLEGAL_ARGUMENT_ERROR) { log_err("FAIL: Cloned converter failed to deal correctly with null bufferSize pointer\n"); } err = U_ZERO_ERROR; /* buffer size pointer is 0 - fill in pbufferSize with a size */ bufferSize = 0; if (0 != ucnv_safeClone(someConverters[0], buffer[0], &bufferSize, &err) || U_FAILURE(err) || bufferSize <= 0) { log_err("FAIL: Cloned converter failed a sizing request ('preflighting')\n"); } /* Verify our define is large enough */ if (U_CNV_SAFECLONE_BUFFERSIZE < bufferSize) { log_err("FAIL: Pre-calculated buffer size is too small\n"); } /* Verify we can use this run-time calculated size */ if (0 == (cnv = ucnv_safeClone(someConverters[0], buffer[0], &bufferSize, &err)) || U_FAILURE(err)) { log_err("FAIL: Converter can't be cloned with run-time size\n"); } if (cnv) ucnv_close(cnv); /* size one byte too small - should allocate & let us know */ --bufferSize; if (0 == (cnv = ucnv_safeClone(someConverters[0], 0, &bufferSize, &err)) || err != U_SAFECLONE_ALLOCATED_WARNING) { log_err("FAIL: Cloned converter failed to deal correctly with too-small buffer size\n"); } if (cnv) ucnv_close(cnv); err = U_ZERO_ERROR; bufferSize = U_CNV_SAFECLONE_BUFFERSIZE; /* Null buffer pointer - return converter & set error to U_SAFECLONE_ALLOCATED_ERROR */ if (0 == (cnv = ucnv_safeClone(someConverters[0], 0, &bufferSize, &err)) || err != U_SAFECLONE_ALLOCATED_WARNING) { log_err("FAIL: Cloned converter failed to deal correctly with null buffer pointer\n"); } if (cnv) ucnv_close(cnv); err = U_ZERO_ERROR; /* Null converter - return NULL & set U_ILLEGAL_ARGUMENT_ERROR */ if (0 != ucnv_safeClone(0, buffer[0], &bufferSize, &err) || err != U_ILLEGAL_ARGUMENT_ERROR) { log_err("FAIL: Cloned converter failed to deal correctly with null converter pointer\n"); } err = U_ZERO_ERROR; /* Do these cloned converters work at all - shuffle UChars to chars & back again..*/ for (index = 0; index < CLONETEST_CONVERTER_COUNT; index++) { bufferSize = U_CNV_SAFECLONE_BUFFERSIZE; someClonedConverters[index] = ucnv_safeClone(someConverters[index], buffer[index], &bufferSize, &err); pCharBuffer = charBuffer; pUniBuffer = uniBuffer; ucnv_fromUnicode(someClonedConverters[index], &pCharBuffer, charBufferLimit, &pUniBuffer, uniBufferLimit, NULL, TRUE, &err); if(U_FAILURE(err)){ log_err("FAIL: cloned converter failed to do fromU conversion. Error: %s\n",u_errorName(err)); } ucnv_toUnicode(someClonedConverters[index], &pUCharTarget, pUCharTargetLimit, &pCharSource, pCharSourceLimit, NULL, TRUE, &err ); if(U_FAILURE(err)){ log_err("FAIL: cloned converter failed to do toU conversion. Error: %s\n",u_errorName(err)); } pConstCharBuffer = charBuffer; if (uniBuffer [0] != ucnv_getNextUChar(someClonedConverters[index], &pConstCharBuffer, pCharBuffer, &err)) { log_err("FAIL: Cloned converter failed to do conversion. Error: %s\n",u_errorName(err)); } ucnv_close(someClonedConverters[index]); ucnv_close(someConverters[index]); } } static void TestCCSID() { UConverter *cnv; UErrorCode errorCode; int32_t ccsids[]={ 37, 850, 943, 949, 950, 1047, 1252, 33722 }; int32_t i, ccsid; for(i=0; i<(int32_t)(sizeof(ccsids)/sizeof(int32_t)); ++i) { ccsid=ccsids[i]; errorCode=U_ZERO_ERROR; cnv=ucnv_openCCSID(ccsid, UCNV_IBM, &errorCode); if(U_FAILURE(errorCode)) { log_err("error: ucnv_openCCSID(%ld) failed (%s)\n", ccsid, u_errorName(errorCode)); continue; } if(ccsid!=ucnv_getCCSID(cnv, &errorCode)) { log_err("error: ucnv_getCCSID(ucnv_openCCSID(%ld))=%ld\n", ccsid, ucnv_getCCSID(cnv, &errorCode)); } if(UCNV_IBM!=ucnv_getPlatform(cnv, &errorCode)) { log_err("error: ucnv_getPlatform(ucnv_openCCSID(%ld))=%ld!=UCNV_IBM\n", ccsid, ucnv_getPlatform(cnv, &errorCode)); } ucnv_close(cnv); } } /* jitterbug 932: ucnv_convert() bugs --------------------------------------- */ /* CHUNK_SIZE defined in common\ucnv.c: */ #define CHUNK_SIZE 5*1024 static void bug1(void); static void bug2(void); static void bug3(void); static void TestJ932(void) { bug1(); /* Unicode intermediate buffer straddle bug */ bug2(); /* pre-flighting size incorrect caused by simple overflow */ bug3(); /* pre-flighting size incorrect caused by expansion overflow */ } /* * jitterbug 932: test chunking boundary conditions in int32_t ucnv_convert(const char *toConverterName, const char *fromConverterName, char *target, int32_t targetSize, const char *source, int32_t sourceSize, UErrorCode * err) * See discussions on the icu mailing list in * 2001-April with the subject "converter 'flush' question". * * Bug report and test code provided by Edward J. Batutis. */ static void bug1() { static char char_in[CHUNK_SIZE+32]; static char char_out[CHUNK_SIZE*2]; /* GB 18030 equivalent of U+10000 is 90308130 */ static const char test_seq[]={ (char)0x90u, 0x30, (char)0x81u, 0x30 }; UErrorCode err = U_ZERO_ERROR; int32_t i, test_seq_len = sizeof(test_seq); /* * causes straddle bug in Unicode intermediate buffer by sliding the test sequence forward * until the straddle bug appears. I didn't want to hard-code everything so this test could * be expanded - however this is the only type of straddle bug I can think of at the moment - * a high surrogate in the last position of the Unicode intermediate buffer. Apparently no * other Unicode sequences cause a bug since combining sequences are not supported by the * converters. */ for (i = test_seq_len; i >= 0; i--) { /* put character sequence into input buffer */ uprv_memset(char_in, 0x61, sizeof(char_in)); /* GB 18030 'a' */ uprv_memcpy(char_in + (CHUNK_SIZE - i), test_seq, test_seq_len); /* do the conversion */ ucnv_convert("us-ascii", /* out */ "gb18030", /* in */ char_out, sizeof(char_out), char_in, sizeof(char_in), &err); /* bug1: */ if (err == U_TRUNCATED_CHAR_FOUND) { /* this happens when surrogate pair straddles the intermediate buffer in * T_UConverter_fromCodepageToCodepage */ log_err("error j932 bug 1: expected success, got U_TRUNCATED_CHAR_FOUND\n"); } } } /* bug2: pre-flighting loop bug: simple overflow causes bug */ static void bug2() { /* US-ASCII "1234567890" */ static const char source[]={ 0x30, 0x31, 0x32, 0x33, 0x34, 0x35, 0x36, 0x37, 0x38, 0x39 }; static const char sourceUTF8[]={ 0x30, 0x31, 0x32, 0x33, 0x34, 0x35, 0x36, (char)0xef, (char)0x80, (char)0x80 }; static const char sourceUTF32[]={ 0x00, 0x00, 0x00, 0x30, 0x00, 0x00, 0x00, 0x31, 0x00, 0x00, 0x00, 0x32, 0x00, 0x00, 0x00, 0x33, 0x00, 0x00, 0x00, 0x34, 0x00, 0x00, 0x00, 0x35, 0x00, 0x00, 0x00, 0x36, 0x00, 0x00, 0x00, 0x37, 0x00, 0x00, 0x00, 0x38, 0x00, 0x00, (char)0xf0, 0x00}; static char target[5]; UErrorCode err = U_ZERO_ERROR; int32_t size; /* do the conversion */ size = ucnv_convert("iso-8859-1", /* out */ "us-ascii", /* in */ target, sizeof(target), source, sizeof(source), &err); if ( size != 10 ) { /* bug2: size is 5, should be 10 */ log_err("error j932 bug 2 us-ascii->iso-8859-1: got preflighting size %d instead of 10\n", size); } err = U_ZERO_ERROR; /* do the conversion */ size = ucnv_convert("UTF-32BE", /* out */ "UTF-8", /* in */ target, sizeof(target), sourceUTF8, sizeof(sourceUTF8), &err); if ( size != 32 ) { /* bug2: size is 5, should be 32 */ log_err("error j932 bug 2 UTF-8->UTF-32BE: got preflighting size %d instead of 32\n", size); } err = U_ZERO_ERROR; /* do the conversion */ size = ucnv_convert("UTF-8", /* out */ "UTF-32BE", /* in */ target, sizeof(target), sourceUTF32, sizeof(sourceUTF32), &err); if ( size != 12 ) { /* bug2: size is 5, should be 12 */ log_err("error j932 bug 2 UTF-32BE->UTF-8: got preflighting size %d instead of 12\n", size); } } /* * bug3: when the characters expand going from source to target codepage * you get bug3 in addition to bug2 */ static void bug3() { static char char_in[CHUNK_SIZE*4]; static char target[5]; UErrorCode err = U_ZERO_ERROR; int32_t size; /* * first get the buggy size from bug2 then * compare it to buggy size with an expansion */ uprv_memset(char_in, 0x61, sizeof(char_in)); /* US-ASCII 'a' */ /* do the conversion */ size = ucnv_convert("lmbcs", /* out */ "us-ascii", /* in */ target, sizeof(target), char_in, sizeof(char_in), &err); if ( size != sizeof(char_in) ) { /* * bug2: size is 0x2805 (CHUNK_SIZE*2+5 - maybe 5 is the size of the overflow buffer * in the converter?), should be CHUNK_SIZE*4 * * Markus 2001-05-18: 5 is the size of our target[] here, ucnv_convert() did not reset targetSize... */ log_err("error j932 bug 2/3a: expected preflighting size 0x%04x, got 0x%04x\n", sizeof(char_in), size); } /* * now do the conversion with expansion * ascii 0x08 expands to 0x0F 0x28 in lmbcs */ uprv_memset(char_in, 8, sizeof(char_in)); err = U_ZERO_ERROR; /* do the conversion */ size = ucnv_convert("lmbcs", /* out */ "us-ascii", /* in */ target, sizeof(target), char_in, sizeof(char_in), &err); /* expect 2X expansion */ if ( size != sizeof(char_in) * 2 ) { /* * bug3: * bug2 would lead us to expect 0x2805, but it isn't that either, it is 0x3c05: */ log_err("error j932 bug 3b: expected 0x%04x, got 0x%04x\n", sizeof(char_in) * 2, size); } } static void TestJ1968(void) { UErrorCode err = U_ZERO_ERROR; UConverter *cnv; char myConvName[] = "My really really really really really really really really really really really" " really really really really really really really really really really really" " really really really really really really really really long converter name"; UChar myConvNameU[sizeof(myConvName)]; u_charsToUChars(myConvName, myConvNameU, sizeof(myConvName)); err = U_ZERO_ERROR; myConvNameU[UCNV_MAX_CONVERTER_NAME_LENGTH+1] = 0; cnv = ucnv_openU(myConvNameU, &err); if (cnv || err != U_ILLEGAL_ARGUMENT_ERROR) { log_err("1U) Didn't get U_ILLEGAL_ARGUMENT_ERROR as expected %s\n", u_errorName(err)); } err = U_ZERO_ERROR; myConvNameU[UCNV_MAX_CONVERTER_NAME_LENGTH] = 0; cnv = ucnv_openU(myConvNameU, &err); if (cnv || err != U_ILLEGAL_ARGUMENT_ERROR) { log_err("2U) Didn't get U_ILLEGAL_ARGUMENT_ERROR as expected %s\n", u_errorName(err)); } err = U_ZERO_ERROR; myConvNameU[UCNV_MAX_CONVERTER_NAME_LENGTH-1] = 0; cnv = ucnv_openU(myConvNameU, &err); if (cnv || err != U_FILE_ACCESS_ERROR) { log_err("3U) Didn't get U_FILE_ACCESS_ERROR as expected %s\n", u_errorName(err)); } err = U_ZERO_ERROR; cnv = ucnv_open(myConvName, &err); if (cnv || err != U_ILLEGAL_ARGUMENT_ERROR) { log_err("1) Didn't get U_ILLEGAL_ARGUMENT_ERROR as expected %s\n", u_errorName(err)); } err = U_ZERO_ERROR; myConvName[UCNV_MAX_CONVERTER_NAME_LENGTH] = ','; cnv = ucnv_open(myConvName, &err); if (cnv || err != U_ILLEGAL_ARGUMENT_ERROR) { log_err("2) Didn't get U_ILLEGAL_ARGUMENT_ERROR as expected %s\n", u_errorName(err)); } err = U_ZERO_ERROR; myConvName[UCNV_MAX_CONVERTER_NAME_LENGTH-1] = ','; cnv = ucnv_open(myConvName, &err); if (cnv || err != U_FILE_ACCESS_ERROR) { log_err("3) Didn't get U_FILE_ACCESS_ERROR as expected %s\n", u_errorName(err)); } err = U_ZERO_ERROR; myConvName[UCNV_MAX_CONVERTER_NAME_LENGTH-1] = ','; strncpy(myConvName + UCNV_MAX_CONVERTER_NAME_LENGTH, "locale=", 7); cnv = ucnv_open(myConvName, &err); if (cnv || err != U_ILLEGAL_ARGUMENT_ERROR) { log_err("4) Didn't get U_ILLEGAL_ARGUMENT_ERROR as expected %s\n", u_errorName(err)); } /* The comma isn't really a part of the converter name. */ err = U_ZERO_ERROR; myConvName[UCNV_MAX_CONVERTER_NAME_LENGTH] = 0; cnv = ucnv_open(myConvName, &err); if (cnv || err != U_FILE_ACCESS_ERROR) { log_err("5) Didn't get U_FILE_ACCESS_ERROR as expected %s\n", u_errorName(err)); } err = U_ZERO_ERROR; myConvName[UCNV_MAX_CONVERTER_NAME_LENGTH-1] = ' '; cnv = ucnv_open(myConvName, &err); if (cnv || err != U_ILLEGAL_ARGUMENT_ERROR) { log_err("6) Didn't get U_ILLEGAL_ARGUMENT_ERROR as expected %s\n", u_errorName(err)); } err = U_ZERO_ERROR; myConvName[UCNV_MAX_CONVERTER_NAME_LENGTH-1] = 0; cnv = ucnv_open(myConvName, &err); if (cnv || err != U_FILE_ACCESS_ERROR) { log_err("7) Didn't get U_FILE_ACCESS_ERROR as expected %s\n", u_errorName(err)); } } static void testSwap(const char *name, UBool swap) { /* * Test Unicode text. * Contains characters that are the highest for some of the * tested conversions, to make sure that the ucnvmbcs.c code that modifies the * tables copies the entire tables. */ static const UChar text[]={ 0x61, 0xd, 0x62, 0xa, 0x4e00, 0x3000, 0xfffd, 0xa, 0x20, 0x85, 0xff5e, 0x7a }; UChar uNormal[32], uSwapped[32]; char normal[32], swapped[32]; const UChar *pcu; UChar *pu; char *pc; int32_t i, normalLength, swappedLength; UChar u; char c; const char *swappedName; UConverter *cnv, *swapCnv; UErrorCode errorCode; /* if the swap flag is FALSE, then the test encoding is not EBCDIC and must not swap */ /* open both the normal and the LF/NL-swapping converters */ strcpy(swapped, name); strcat(swapped, UCNV_SWAP_LFNL_OPTION_STRING); errorCode=U_ZERO_ERROR; swapCnv=ucnv_open(swapped, &errorCode); cnv=ucnv_open(name, &errorCode); if(U_FAILURE(errorCode)) { log_err("TestEBCDICSwapLFNL error: unable to open %s or %s (%s)\n", name, swapped, u_errorName(errorCode)); goto cleanup; } /* the name must contain the swap option if and only if we expect the converter to swap */ swappedName=ucnv_getName(swapCnv, &errorCode); if(U_FAILURE(errorCode)) { log_err("TestEBCDICSwapLFNL error: ucnv_getName(%s,swaplfnl) failed (%s)\n", name, u_errorName(errorCode)); goto cleanup; } pc=strstr(swappedName, UCNV_SWAP_LFNL_OPTION_STRING); if(swap != (pc!=NULL)) { log_err("TestEBCDICSwapLFNL error: ucnv_getName(%s,swaplfnl)=%s should (%d) contain 'swaplfnl'\n", name, swappedName, swap); goto cleanup; } /* convert to EBCDIC */ pcu=text; pc=normal; ucnv_fromUnicode(cnv, &pc, normal+LENGTHOF(normal), &pcu, text+LENGTHOF(text), NULL, TRUE, &errorCode); normalLength=(int32_t)(pc-normal); pcu=text; pc=swapped; ucnv_fromUnicode(swapCnv, &pc, swapped+LENGTHOF(swapped), &pcu, text+LENGTHOF(text), NULL, TRUE, &errorCode); swappedLength=(int32_t)(pc-swapped); if(U_FAILURE(errorCode)) { log_err("TestEBCDICSwapLFNL error converting to %s - (%s)\n", name, u_errorName(errorCode)); goto cleanup; } /* compare EBCDIC output */ if(normalLength!=swappedLength) { log_err("TestEBCDICSwapLFNL error converting to %s - output lengths %d vs. %d\n", name, normalLength, swappedLength); goto cleanup; } for(i=0; i