scuffed-code/icu4c/source/test/cintltst/udatatst.c

1869 lines
66 KiB
C

/********************************************************************
* COPYRIGHT:
* Copyright (c) 1998-2016, International Business Machines Corporation and
* others. All Rights Reserved.
********************************************************************/
/*
* File udatatst.c
*
* Modification History:
*
* Date Name Description
* 02/22/2000 Madhu Creation
******************************************************************************
*/
#include "unicode/utypes.h"
#include "unicode/putil.h"
#include "unicode/udata.h"
#include "unicode/ucal.h"
#include "unicode/uchar.h"
#include "unicode/ucnv.h"
#include "unicode/ures.h"
#include "unicode/ustring.h"
#include "unicode/uclean.h"
#include "cmemory.h"
#include "cstring.h"
#include "filestrm.h"
#include "udatamem.h"
#include "cintltst.h"
#include "ubrkimpl.h"
#include "toolutil.h" /* for uprv_fileExists() */
#include <stdlib.h>
#include <stdio.h>
/* includes for TestSwapData() */
#include "udataswp.h"
/* swapping implementations in common */
#include "uresdata.h"
#include "ucnv_io.h"
#include "uprops.h"
#include "ucase.h"
#include "ucol_imp.h"
#include "ucol_swp.h"
#include "ucnv_bld.h"
#include "sprpimpl.h"
#include "rbbidata.h"
/* swapping implementation in i18n */
#include "uspoof_impl.h"
/*
 * Local prototype for unorm2_swap().
 * NOTE(review): presumably declared here because none of the headers included
 * above exports it, and presumably used by TestSwapData() -- confirm.
 */
U_CAPI int32_t U_EXPORT2
unorm2_swap(const UDataSwapper *ds,
const void *inData, int32_t length, void *outData,
UErrorCode *pErrorCode);
/* other definitions and prototypes */
/* Tests that are only compiled when file I/O and legacy conversion are enabled. */
#if !UCONFIG_NO_FILE_IO && !UCONFIG_NO_LEGACY_CONVERSION
static void TestUDataOpen(void);
static void TestUDataOpenChoiceDemo1(void);
static void TestUDataOpenChoiceDemo2(void);
static void TestUDataGetInfo(void);
static void TestUDataGetMemory(void);
static void TestErrorConditions(void);
static void TestAppData(void);
static void TestSwapData(void);
#endif
/* Tests that are always compiled. */
static void TestUDataSetAppData(void);
static void TestICUDataName(void);
static void PointerTableOfContents(void);
static void SetBadCommonData(void);
static void TestUDataFileAccess(void);
/* This test additionally requires formatting support. */
#if !UCONFIG_NO_FORMATTING && !UCONFIG_NO_FILE_IO && !UCONFIG_NO_LEGACY_CONVERSION
static void TestTZDataDir(void);
#endif
/* Entry point that registers every test of this file (defined right below). */
void addUDataTest(TestNode** root);
/*
 * Registers all udata tests of this file under the "udatatst/" prefix of the
 * test tree rooted at *root.  Which tests are registered depends on the same
 * UCONFIG_* switches that guard their prototypes.
 */
void
addUDataTest(TestNode** root)
{
/* Builds the test path from the function name, e.g. "udatatst/TestUDataOpen". */
#define ADD_UDATA_TEST(testFunction) \
    addTest(root, &testFunction, "udatatst/" #testFunction)

#if !UCONFIG_NO_FILE_IO && !UCONFIG_NO_LEGACY_CONVERSION
    ADD_UDATA_TEST(TestUDataOpen);
    ADD_UDATA_TEST(TestUDataOpenChoiceDemo1);
    ADD_UDATA_TEST(TestUDataOpenChoiceDemo2);
    ADD_UDATA_TEST(TestUDataGetInfo);
    ADD_UDATA_TEST(TestUDataGetMemory);
    ADD_UDATA_TEST(TestErrorConditions);
    ADD_UDATA_TEST(TestAppData);
    ADD_UDATA_TEST(TestSwapData);
#endif

    ADD_UDATA_TEST(TestUDataSetAppData);
    ADD_UDATA_TEST(TestICUDataName);
    ADD_UDATA_TEST(PointerTableOfContents);
    ADD_UDATA_TEST(SetBadCommonData);
    ADD_UDATA_TEST(TestUDataFileAccess);

#if !UCONFIG_NO_FORMATTING && !UCONFIG_NO_FILE_IO && !UCONFIG_NO_LEGACY_CONVERSION
    ADD_UDATA_TEST(TestTZDataDir);
#endif

#undef ADD_UDATA_TEST
}
#if 0
/*
 * Debugging helper, compiled out by the surrounding "#if 0".
 * For q = 1..99 it allocates and immediately frees q bytes, then allocates
 * q*2 bytes and discards the pointer, so that second allocation is never freed.
 * NOTE(review): presumably meant to perturb the heap while chasing memory
 * bugs -- confirm before re-enabling.
 */
static void lots_of_mallocs()
{
int q;
for(q=1;q<100;q++)
{
free(malloc(q));
malloc(q*2);
}
}
#endif
#if !UCONFIG_NO_FILE_IO && !UCONFIG_NO_LEGACY_CONVERSION
static void TestUDataOpen(){
UDataMemory *result;
UErrorCode status=U_ZERO_ERROR;
const char* memMap[][2]={
{"root", "res"},
{"cnvalias", "icu"},
{"unames", "icu"},
{"ibm-37_P100-1995", "cnv"}
};
const char* name = "test";
const char* type = "icu";
const char dirSepString[] = {U_FILE_SEP_CHAR, 0};
const char pathSepString[] = {U_PATH_SEP_CHAR, 0};
char* path=(char*)malloc(sizeof(char) * (strlen(ctest_dataOutDir())
+ strlen(U_ICUDATA_NAME)
+ strlen("/build/tmp/..")+1 ) );
char *icuDataFilePath = 0;
const char* testPath=loadTestData(&status);
if(U_FAILURE(status)) {
log_data_err("Could not load testdata.dat, status = %s\n", u_errorName(status));
free(path);
return;
}
/* lots_of_mallocs(); */
log_verbose("Testing udata_open(%s)\n", testPath);
result=udata_open(testPath, type, name, &status);
if(U_FAILURE(status)){
log_data_err("FAIL: udata_open() failed for path = %s, name=%s, type=%s, \n errorcode=%s\n", testPath, name, type, myErrorName(status));
} else {
log_verbose("PASS: udata_open worked\n");
udata_close(result);
}
{
strcat(strcpy(path, ctest_dataOutDir()), U_ICUDATA_NAME);
/* If the ICU system common data file is present in this confiugration,
* verify that udata_open can explicitly fetch items from it.
* If packaging mode == dll, the file may not exist. So, if the file is
* missing, skip this test without error.
*/
icuDataFilePath = (char *)uprv_malloc(strlen(path) + 10);
strcpy(icuDataFilePath, path);
strcat(icuDataFilePath, ".dat");
/* lots_of_mallocs(); */
if (uprv_fileExists(icuDataFilePath))
{
int i;
log_verbose("Testing udata_open() on %s\n", icuDataFilePath);
for(i=0; i<UPRV_LENGTHOF(memMap); i++){
/* lots_of_mallocs(); */
status=U_ZERO_ERROR;
result=udata_open(path, memMap[i][1], memMap[i][0], &status);
if(U_FAILURE(status)) {
log_data_err("FAIL: udata_open() failed for path = %s, name=%s, type=%s, \n errorcode=%s\n", path, memMap[i][0], memMap[i][1], myErrorName(status));
} else {
log_verbose("PASS: udata_open worked for path = %s, name=%s, type=%s\n", path, memMap[i][0], memMap[i][1]);
udata_close(result);
}
}
}
else
{
/* lots_of_mallocs(); */
log_verbose("Skipping tests of udata_open() on %s. File not present in this configuration.\n",
icuDataFilePath);
}
uprv_free(icuDataFilePath);
}
/* try again, adding /tmp */
{
strcpy(path, ctest_dataOutDir());
strcat(path, "tmp");
strcat(path, dirSepString);
strcat(path, U_ICUDATA_NAME);
/* If the ICU system common data file is present in this confiugration,
* verify that udata_open can explicitly fetch items from it.
* If packaging mode == dll, the file may not exist. So, if the file is
* missing, skip this test without error.
*/
icuDataFilePath = (char *)malloc(strlen(path) + 10);
strcpy(icuDataFilePath, path);
strcat(icuDataFilePath, ".dat");
/* lots_of_mallocs(); */
if (uprv_fileExists(icuDataFilePath))
{
int i;
log_verbose("Testing udata_open() on %s\n", icuDataFilePath);
for(i=0; i<UPRV_LENGTHOF(memMap); i++){
/* lots_of_mallocs(); */
status=U_ZERO_ERROR;
result=udata_open(path, memMap[i][1], memMap[i][0], &status);
if(U_FAILURE(status)) {
log_data_err("FAIL: udata_open() failed for path = %s, name=%s, type=%s, \n errorcode=%s\n", path, memMap[i][0], memMap[i][1], myErrorName(status));
} else {
log_verbose("PASS: udata_open worked for path = %s, name=%s, type=%s\n", path, memMap[i][0], memMap[i][1]);
udata_close(result);
}
}
}
else
{
/* lots_of_mallocs(); */
log_verbose("Skipping tests of udata_open() on %s. File not present in this configuration.\n",
icuDataFilePath);
}
}
free(icuDataFilePath);
icuDataFilePath = NULL;
/* lots_of_mallocs(); */
/* If the ICU individual files used to build the ICU system common data are
* present in this configuration,
* verify that udata_open can explicitly open them.
* These data files are present in the ICU data/build directory after a build
* completes. Tests are most commonly run with the data directory pointing
* back into this directory structure, but this is not required. Soooo, if
* the files are missing, skip this test without error.
*/
/* lots_of_mallocs(); */
icuDataFilePath = (char *)malloc(strlen(ctest_dataOutDir()) + 50);
strcpy(icuDataFilePath, ctest_dataOutDir());
strcat(icuDataFilePath, "build");
strcat(icuDataFilePath, dirSepString);
strcat(icuDataFilePath, U_ICUDATA_NAME);
strcat(icuDataFilePath, dirSepString);
strcat(icuDataFilePath, "cnvalias.icu");
/* lots_of_mallocs(); */
if (uprv_fileExists(icuDataFilePath))
{
int i;
log_verbose("%s exists, so..\n", icuDataFilePath);
strcpy(icuDataFilePath, ctest_dataOutDir());
strcat(icuDataFilePath, "build");
strcat(icuDataFilePath, dirSepString);
strcat(icuDataFilePath, U_ICUDATA_NAME);
log_verbose("Testing udata_open() on %s\n", icuDataFilePath);
for(i=0; i<UPRV_LENGTHOF(memMap); i++){
status=U_ZERO_ERROR;
result=udata_open(icuDataFilePath, memMap[i][1], memMap[i][0], &status);
if(U_FAILURE(status)) {
log_data_err("FAIL: udata_open() failed for path = %s, name=%s, type=%s, \n errorcode=%s\n", icuDataFilePath, memMap[i][0], memMap[i][1], myErrorName(status));
} else {
log_verbose("PASS: udata_open worked for path = %s, name=%s, type=%s\n", icuDataFilePath, memMap[i][0], memMap[i][1]);
udata_close(result);
}
}
}
else
{
log_verbose("Skipping tests of udata_open() on %s. File not present in this configuration.\n",
icuDataFilePath);
}
free(icuDataFilePath);
icuDataFilePath = NULL;
/*
* Test fallback file names for open of separate data files.
* With these params to udata_open:
* path = wherever/testdata
* type = typ
* name = nam
* these files will be tried first:
* wherever/testudata_nam.typ
* testudata_nam.typ
* A test data file named testudata_nam.typ exists for the purpose of testing this.
*/
log_verbose("Testing udata_open, with base_name.type style fallback to individual file.\n");
status = U_ZERO_ERROR;
result = udata_open( testPath, "typ", "nam", &status);
if (status != U_ZERO_ERROR) {
log_data_err("FAIL: udata_open( \"%s\", \"typ\", \"nam\") returned status %s\n", testPath, u_errorName(status));
}
udata_close(result);
free(icuDataFilePath);
/* This type of path is deprecated */
/*
* Another fallback test. Paths ending with a trailing directory separator
* take a slightly different code path, with the "base name" from the path
* being empty in the internal udata_open logic.
*/
/* log_verbose("Testing udata_open, with path containing a trailing directory separator.\n"); */
/* icuDataFilePath = (char *)malloc(strlen(u_getDataDirectory()) + 50); */
/* strcpy(icuDataFilePath, testPath); */
/* status = U_ZERO_ERROR; */
/* result = udata_open( icuDataFilePath, "cnv", "test1", &status); */
/* if (status != U_ZERO_ERROR) { */
/* log_err("FAIL: udata_open( \"%s\", \"cnv\", \"test1\") returned status %s\n", icuDataFilePath, u_errorName(status)); */
/* } */
/* udata_close(result); */
/* free(icuDataFilePath); */
log_verbose("Testing udata_open() with a non existing binary file\n");
result=udata_open("testdata", "tst", "nonexist", &status);
if(status==U_FILE_ACCESS_ERROR){
log_verbose("Opening udata_open with non-existing file handled correctly.\n");
status=U_ZERO_ERROR;
} else {
log_err("calling udata_open with non-existing file [testdata | nonexist.tst] not handled correctly\n. Expected: U_FILE_ACCESS_ERROR, Got: %s\n", myErrorName(status));
if(U_SUCCESS(status)) {
udata_close(result);
}
}
if(result != NULL){
log_err("calling udata_open with non-existing file didn't return a null value\n");
} else {
log_verbose("calling udat_open with non-existing file returned null as expected\n");
}
/*
* Try opening data with absurdly long path and name, to trigger buffer size
* overflow handling code.
*/
{
char longTestPath[1024]; /* Implementation goes to heap at length of 128. */
char longName[1024];
/* Try a very long nonexistent directory path.
* udata_open should still succeed. Opening with the path will fail,
* then fall back to skipping the directory portion of the path.
*/
log_verbose("Testing udata_open() with really long names\n");
longTestPath[0] = 0;
strcat(longTestPath, "bogus_directory_name");
while (strlen(longTestPath) < 500) {
strcat(longTestPath, dirSepString);
strcat(longTestPath, "bogus_directory_name");
}
strcat(longTestPath, pathSepString);
strcat(longTestPath, testPath);
result=udata_open(longTestPath, type, name, &status);
if(U_FAILURE(status)){
log_data_err("FAIL: udata_open() failed for path = %s\n name=%s, type=%s, \n errorcode=%s\n",
longTestPath, name, type, myErrorName(status));
} else {
log_verbose("PASS: udata_open worked\n");
udata_close(result);
}
/* Try a very long name. Won't open, but shouldn't blow up.
*/
longName[0] = 0;
while (strlen(longName) < 500) {
strcat(longName, name);
strcat(longName, "_");
}
strcat(longName, dirSepString);
strcat(longName, name);
result=udata_open(longTestPath, type, longName, &status);
if (status != U_FILE_ACCESS_ERROR) {
log_data_err("FAIL: udata_open() failed for path = %s\n name=%s, type=%s, \n errorcode=%s\n",
longTestPath, longName, type, myErrorName(status));
}
udata_close(result);
}
free(path);
}
#endif
/*
 * In-memory layout used by this file to hand-build a data header image
 * (see gEmptyHeader below, which is passed to udata_setAppData()).
 * The fields are: a 16-bit header size, two magic bytes, a UDataInfo,
 * 8 bytes of padding, a 32-bit entry count plus a reserved word, and four
 * 32-bit words standing in for a single table-of-contents entry.
 */
typedef struct {
uint16_t headerSize;
uint8_t magic1, magic2;
UDataInfo info;
char padding[8];
uint32_t count, reserved;
/*
 * The table of contents that fakeNameAndData stands in for would look like:
const struct {
const char *const name;
const void *const data;
} toc[1];
*/
int32_t fakeNameAndData[4];
} ICU_COMMON_Data_Header;
/*
 * A header image with data format "CmnD", format version 1.0.0.0 and an
 * entry count of zero, matching this platform's endianness, charset family
 * and UChar size.  TestUDataSetAppData() passes it to udata_setAppData().
 */
static const ICU_COMMON_Data_Header gEmptyHeader = {
32, /* headerSize */
0xda, /* magic1, (see struct MappedData in udata.c) */
0x27, /* magic2 */
{ /*UDataInfo */
sizeof(UDataInfo), /* size */
0, /* reserved */
/* isBigEndian: 1 on big-endian platforms, 0 otherwise */
#if U_IS_BIG_ENDIAN
1,
#else
0,
#endif
U_CHARSET_FAMILY, /* charsetFamily */
sizeof(UChar), /* sizeofUChar */
0, /* reserved */
{ /* data format identifier */
0x43, 0x6d, 0x6e, 0x44}, /* "CmnD" */
{1, 0, 0, 0}, /* format version major, minor, milli, micro */
{0, 0, 0, 0} /* dataVersion */
},
{0,0,0,0,0,0,0,0}, /* Padding[8] */
0, /* count */
0, /* Reserved */
{ /* TOC structure */
/* { */
0 , 0 , 0, 0 /* name and data entries. Count says there are none, */
/* but put one in just in case. */
/* } */
}
};
/*
 * Checks the status codes reported by udata_setAppData():
 *   - NULL data must be rejected with U_ILLEGAL_ARGUMENT_ERROR,
 *   - a call made while the status already holds an error is issued without
 *     checking the outcome,
 *   - registering gEmptyHeader under two fresh names must give U_ZERO_ERROR,
 *   - registering a name a second time must give U_USING_DEFAULT_WARNING.
 * The test stops at the first unexpected status.
 */
static void TestUDataSetAppData(){
    const char *const firstPackage = "appData1";
    const char *const secondPackage = "appData2";
    UErrorCode errorCode = U_ZERO_ERROR;

    /* Monkey business first: NULL data is not acceptable. */
    udata_setAppData(firstPackage, NULL, &errorCode);
    if (errorCode != U_ILLEGAL_ARGUMENT_ERROR) {
        log_err("FAIL: TestUDataSetAppData(): udata_setAppData(\"appData1\", NULL, status) should have failed."
                " It returned status of %s\n", u_errorName(errorCode));
        return;
    }

    /* errorCode still holds the failure from above, so this call should fail.
     * If it works anyway, the later calls for appData1 should fail.
     */
    udata_setAppData(firstPackage, &gEmptyHeader, &errorCode);

    /* Now register the memory image for real. */
    errorCode = U_ZERO_ERROR;
    udata_setAppData(firstPackage, &gEmptyHeader, &errorCode);
    if (errorCode != U_ZERO_ERROR) {
        log_err("FAIL: TestUDataSetAppData(): udata_setAppData(\"appData1\", fileBuf, status) "
                " returned status of %s\n", u_errorName(errorCode));
        return;
    }

    udata_setAppData(secondPackage, &gEmptyHeader, &errorCode);
    if (errorCode != U_ZERO_ERROR) {
        log_err("FAIL: TestUDataSetAppData(): udata_setAppData(\"appData2\", fileBuf, status) "
                " returned status of %s\n", u_errorName(errorCode));
        return;
    }

    /* Setting app data under an already-used name must report a
     * using-default warning.
     */
    udata_setAppData(secondPackage, &gEmptyHeader, &errorCode);
    if (errorCode != U_USING_DEFAULT_WARNING) {
        log_err("FAIL: TestUDataSetAppData(): udata_setAppData(\"appData2\", fileBuf, status) "
                " returned status of %s, expected U_USING_DEFAULT_WARNING.\n", u_errorName(errorCode));
    }

    /* It is no longer correct to use udata_setAppData to change the package
     * of a contained item, so nothing is opened from "appData1" here.
     */
}
/*
 * Returns a heap-allocated copy of the current ICU data directory string, so
 * that it survives u_cleanup() (the string returned by u_getDataDirectory()
 * vanishes with u_cleanup()).
 *
 * @return the copy, to be released by the caller with free(); NULL if
 *         u_getDataDirectory() returned NULL or the allocation failed.
 */
static char *safeGetICUDataDirectory() {
    const char *dataDir = u_getDataDirectory();
    char *retStr = NULL;
    if (dataDir != NULL) {
        retStr = (char *)malloc(strlen(dataDir)+1);
        if (retStr != NULL) {   /* never copy into a failed allocation */
            strcpy(retStr, dataDir);
        }
    }
    return retStr;
}
/*
 * Cycles ICU through every udata_setFileAccess() mode, each time with a
 * u_cleanup() before and a u_init() after the call.
 *
 * Only two outcomes are checked: u_init() under UDATA_NO_FILES is reported
 * (as a data error) when it fails while the saved data directory is empty,
 * and u_init() under UDATA_DEFAULT_ACCESS with the data directory restored
 * must succeed.  The saved directory is put back before the last u_init(),
 * and ctest_resetICU() is called at the end.
 */
static void TestUDataFileAccess(){
    UErrorCode status;
    char *icuDataDir;
    icuDataDir = safeGetICUDataDirectory(); /* save icu data dir, so we can put it back
                                             * after doing u_cleanup(). */
    if(icuDataDir == NULL){
        /* Without the saved directory it could not be restored after
         * u_cleanup(), and it would be dereferenced below; bail out first. */
        log_err("FAIL: TestUDataFileAccess(): could not save the ICU data directory\n");
        return;
    }

    /** UDATA_NO_FILES, ICU does not access the file system for data loading. */
    status=U_ZERO_ERROR;
    u_cleanup();
    udata_setFileAccess(UDATA_NO_FILES,&status);
    u_init(&status);
    if(U_FAILURE(status) && *icuDataDir == 0){
        log_data_err("udata_setFileAccess(UDATA_NO_FILES) failed with ICU_DATA=\"\" err=%s\n", u_errorName(status));
    }

    /** UDATA_ONLY_PACKAGES, ICU only loads data from packages, not from single files. */
    status=U_ZERO_ERROR;
    u_cleanup();
    udata_setFileAccess(UDATA_ONLY_PACKAGES,&status);
    u_init(&status);

    /** UDATA_PACKAGES_FIRST, ICU loads data from packages first, and only from single files
        if the data cannot be found in a package. */
    status=U_ZERO_ERROR;
    u_cleanup();
    udata_setFileAccess(UDATA_PACKAGES_FIRST,&status);
    u_init(&status);

    /** UDATA_FILES_FIRST, ICU looks for data in single files first, then in packages. (default) */
    status=U_ZERO_ERROR;
    u_cleanup();
    udata_setFileAccess(UDATA_FILES_FIRST,&status);
    u_init(&status);

    /** An alias for the default access mode. */
    status=U_ZERO_ERROR;
    u_cleanup();
    udata_setFileAccess(UDATA_DEFAULT_ACCESS,&status);
    u_setDataDirectory(icuDataDir);
    u_init(&status);
    if(U_FAILURE(status)){
        log_err_status(status, "%s\n", u_errorName(status));
    }

    free(icuDataDir);
    ctest_resetICU();
}
/*
 * Acceptance callback for udata_openChoice(): accepts data whose UDataInfo
 * has size >= 20, matches this platform's endianness and charset family,
 * carries the data format bytes 0x43 0x76 0x41 0x6c ("CvAl") and has
 * formatVersion[0] == 3.  The context argument is not used.
 *
 * @return TRUE if the data is acceptable, FALSE otherwise (after logging the
 *         header fields that were seen).
 */
static UBool U_CALLCONV
isAcceptable1(void *context,
              const char *type, const char *name,
              const UDataInfo *pInfo) {
    const UBool accepted = (UBool)(
        pInfo->size>=20 &&
        pInfo->isBigEndian==U_IS_BIG_ENDIAN &&
        pInfo->charsetFamily==U_CHARSET_FAMILY &&
        pInfo->dataFormat[0]==0x43 &&   /* 'C' */
        pInfo->dataFormat[1]==0x76 &&   /* 'v' */
        pInfo->dataFormat[2]==0x41 &&   /* 'A' */
        pInfo->dataFormat[3]==0x6c &&   /* 'l' */
        pInfo->formatVersion[0]==3);

    if(!accepted) {
        log_verbose("The data from \"%s.%s\" IS NOT acceptable using the verifing function isAcceptable1():-\n"
                    "\tsize = %d\n"
                    "\tisBigEndian = %d\n"
                    "\tcharsetFamily = %d\n"
                    "\tformatVersion[0] = %d\n"
                    "\tdataVersion[0] = %d\n"
                    "\tdataFormat = %c%c%c%c\n",
                    name, type, pInfo->size, pInfo->isBigEndian, pInfo->charsetFamily, pInfo->formatVersion[0],
                    pInfo->dataVersion[0], pInfo->dataFormat[0], pInfo->dataFormat[1], pInfo->dataFormat[2],
                    pInfo->dataFormat[3]);
        log_verbose("Call another verifing function to accept the data\n");
        return FALSE;
    }

    log_verbose("The data from \"%s.%s\" IS acceptable using the verifing function isAcceptable1()\n", name, type);
    return TRUE;
}
/*
 * Acceptance callback for udata_openChoice(): accepts data whose UDataInfo
 * has size >= 20, matches this platform's endianness and charset family,
 * carries the data format bytes 0x75 0x6e 0x61 0x6d ("unam"), has
 * formatVersion[0] == 1 and whose dataVersion[0] equals the first field of
 * the version reported by u_getUnicodeVersion().  The context argument is
 * not used.
 *
 * @return TRUE if the data is acceptable, FALSE otherwise.
 */
static UBool U_CALLCONV
isAcceptable2(void *context,
              const char *type, const char *name,
              const UDataInfo *pInfo){
    UVersionInfo currentUnicode;
    UBool accepted;

    u_getUnicodeVersion(currentUnicode);
    accepted = (UBool)(
        pInfo->size>=20 &&
        pInfo->isBigEndian==U_IS_BIG_ENDIAN &&
        pInfo->charsetFamily==U_CHARSET_FAMILY &&
        pInfo->dataFormat[0]==0x75 &&   /* 'u' */
        pInfo->dataFormat[1]==0x6e &&   /* 'n' */
        pInfo->dataFormat[2]==0x61 &&   /* 'a' */
        pInfo->dataFormat[3]==0x6d &&   /* 'm' */
        pInfo->formatVersion[0]==1 &&
        pInfo->dataVersion[0]==currentUnicode[0]);

    if(!accepted) {
        log_verbose("The data from \"%s.%s\" IS NOT acceptable using the verifing function isAcceptable2()\n", name, type);
        return FALSE;
    }

    log_verbose("The data from \"%s.%s\" IS acceptable using the verifing function isAcceptable2()\n", name, type);
    return TRUE;
}
/*
 * Acceptance callback for udata_openChoice(): accepts data whose UDataInfo
 * has size >= 20, matches this platform's endianness and charset family,
 * carries the data format bytes 0x54 0x65 0x73 0x74 ("Test"), and has
 * formatVersion[0] == 1 and dataVersion[0] == 1.  The context argument is
 * not used.
 *
 * @return TRUE if the data is acceptable, FALSE otherwise.
 */
static UBool U_CALLCONV
isAcceptable3(void *context,
              const char *type, const char *name,
              const UDataInfo *pInfo){
    const UBool accepted = (UBool)(
        pInfo->size>=20 &&
        pInfo->isBigEndian==U_IS_BIG_ENDIAN &&
        pInfo->charsetFamily==U_CHARSET_FAMILY &&
        pInfo->dataFormat[0]==0x54 &&   /* 'T' */
        pInfo->dataFormat[1]==0x65 &&   /* 'e' */
        pInfo->dataFormat[2]==0x73 &&   /* 's' */
        pInfo->dataFormat[3]==0x74 &&   /* 't' */
        pInfo->formatVersion[0]==1 &&
        pInfo->dataVersion[0]==1);

    if(!accepted) {
        log_verbose("The data from \"%s.%s\" IS NOT acceptable using the verifing function isAcceptable3()\n", name, type);
        return FALSE;
    }

    log_verbose("The data from \"%s.%s\" IS acceptable using the verifing function isAcceptable3()\n", name, type);
    return TRUE;
}
#if !UCONFIG_NO_FILE_IO && !UCONFIG_NO_LEGACY_CONVERSION
/*
 * Exercises udata_openChoice() with different acceptance callbacks:
 *   1. "cnvalias.icu" must be accepted by isAcceptable1().
 *   2. "unames.icu" must be rejected by isAcceptable1() and is then retried
 *      with isAcceptable2().
 *   3. "test.icu" from "testdata" must be rejected by isAcceptable1() and is
 *      then retried with isAcceptable3().
 *   4. "nam.typ" from the test data must be rejected by isAcceptable1() with
 *      U_INVALID_FORMAT_ERROR.
 *   5. A call made with a failure status already set must leave that status
 *      untouched.
 * Any UDataMemory that comes back non-NULL, even from a call that was
 * expected to fail, is closed so that a failing test does not leak it.
 */
static void TestUDataOpenChoiceDemo1() {
    UDataMemory *result;
    UErrorCode status=U_ZERO_ERROR;
    const char* name[]={
        "cnvalias",
        "unames",
        "test",
        "nam"
    };
    const char* type="icu";
    const char* testPath="testdata";
    const char* fullTestDataPath = loadTestData(&status);
    if(U_FAILURE(status)) {
        log_data_err("Could not load testdata.dat, status = %s\n", u_errorName(status));
        return;
    }

    /* 1. cnvalias.icu is what isAcceptable1() looks for. */
    result=udata_openChoice(NULL, "icu", name[0], isAcceptable1, NULL, &status);
    if(U_FAILURE(status)){
        log_data_err("FAIL: udata_openChoice() failed name=%s, type=%s, \n errorcode=%s\n", name[0], type, myErrorName(status));
    } else {
        log_verbose("PASS: udata_openChoice worked\n");
        udata_close(result);
    }

    /* 2. unames.icu: rejected by isAcceptable1(), then tried with isAcceptable2(). */
    status=U_ZERO_ERROR;
    result=udata_openChoice(NULL, type, name[1], isAcceptable1, NULL, &status);
    if(U_FAILURE(status)){
        status=U_ZERO_ERROR;
        result=udata_openChoice(NULL, type, name[1], isAcceptable2, NULL, &status);
        if(U_FAILURE(status)){
            log_data_err("FAIL: udata_openChoice() failed name=%s, type=%s, \n errorcode=%s\n", name[1], type, myErrorName(status));
        }
    }
    else {
        log_err("FAIL: udata_openChoice() unexpectedly passed. name=%s, type=%s, \n errorcode=%s\n", name[1], type, myErrorName(status));
    }
    if(U_SUCCESS(status)){
        udata_close(result);
    }

    /* 3. test.icu: rejected by isAcceptable1(), then tried with isAcceptable3(). */
    status=U_ZERO_ERROR;
    result=udata_openChoice(testPath, type, name[2], isAcceptable1, NULL, &status);
    if(U_FAILURE(status)){
        status=U_ZERO_ERROR;
        result=udata_openChoice(testPath, type, name[2], isAcceptable3, NULL, &status);
        if(U_FAILURE(status)){
            log_data_err("FAIL: udata_openChoice() failed path=%s name=%s, type=%s, \n errorcode=%s\n", testPath, name[2], type, myErrorName(status));
        }
    }
    else {
        log_err("FAIL: udata_openChoice() unexpectedly passed. name=%s, type=%s, \n errorcode=%s\n", name[2], type, myErrorName(status));
    }
    if(U_SUCCESS(status)){
        udata_close(result);
    }

    /* 4. nam.typ exists but must be rejected by isAcceptable1(). */
    status=U_ZERO_ERROR;
    type="typ";
    result=udata_openChoice(fullTestDataPath, type, name[3], isAcceptable1, NULL, &status);
    if(status != U_INVALID_FORMAT_ERROR){
        log_err("FAIL: udata_openChoice() did not fail as expected. name=%s, type=%s, \n errorcode=%s\n", name[3], type, myErrorName(status));
    }
    if(result != NULL){
        /* Unexpected success: do not leak the opened data. */
        udata_close(result);
    }

    /* 5. A pre-set failure status must be left untouched. */
    status=U_USELESS_COLLATOR_ERROR;
    result=udata_openChoice(fullTestDataPath, type, name[3], isAcceptable1, NULL, &status);
    if(status != U_USELESS_COLLATOR_ERROR){
        log_err("FAIL: udata_openChoice() did not fail as expected. name=%s, type=%s, \n errorcode=%s\n", name[3], type, myErrorName(status));
    }
    if(result != NULL){
        udata_close(result);
    }
}
/*
 * Acceptance callback for udata_openChoice() that also looks at its context:
 * accepts data under the same header conditions as the "Test" format check
 * (size >= 20, platform endianness and charset family, data format bytes
 * 0x54 0x65 0x73 0x74, formatVersion[0] == 1, dataVersion[0] == 1) and only
 * if the int that context points to equals 2.  The context is read last, and
 * only when every header condition holds.
 *
 * @param context pointer to an int supplied by the caller of udata_openChoice()
 * @return TRUE if the data is acceptable, FALSE otherwise.
 */
static UBool U_CALLCONV
isAcceptable(void *context,
             const char *type, const char *name,
             const UDataInfo *pInfo){
    const UBool accepted = (UBool)(
        pInfo->size>=20 &&
        pInfo->isBigEndian==U_IS_BIG_ENDIAN &&
        pInfo->charsetFamily==U_CHARSET_FAMILY &&
        pInfo->dataFormat[0]==0x54 &&   /* 'T' */
        pInfo->dataFormat[1]==0x65 &&   /* 'e' */
        pInfo->dataFormat[2]==0x73 &&   /* 's' */
        pInfo->dataFormat[3]==0x74 &&   /* 't' */
        pInfo->formatVersion[0]==1 &&
        pInfo->dataVersion[0]==1 &&
        *((int*)context) == 2);

    if(!accepted) {
        log_verbose("The data from \"%s.%s\" IS NOT acceptable using the verifing function isAcceptable()\n", name, type);
        return FALSE;
    }

    log_verbose("The data from\"%s.%s\" IS acceptable using the verifing function isAcceptable()\n", name, type);
    return TRUE;
}
/*
 * This test checks to see if the isAcceptable function is being called
 * correctly, i.e. that the context pointer handed to udata_openChoice()
 * reaches the callback.
 *
 * isAcceptable() accepts the data only when the int behind its context is 2.
 * The test first opens "test.icu" with p == 2, then walks p through 0, 1
 * and 2: the first two values must be rejected with U_INVALID_FORMAT_ERROR
 * and the last one must be accepted.  Every iteration starts from
 * U_ZERO_ERROR so that an unexpected status cannot short-circuit later
 * calls, and data opened unexpectedly is closed rather than leaked.
 */
static void TestUDataOpenChoiceDemo2() {
    UDataMemory *result;
    UErrorCode status=U_ZERO_ERROR;
    int p=2;
    const char* name="test";
    const char* type="icu";
    const char* path = loadTestData(&status);
    if(U_FAILURE(status)) {
        log_data_err("Could not load testdata.dat, status = %s\n", u_errorName(status));
        return;
    }

    result=udata_openChoice(path, type, name, isAcceptable, &p, &status);
    if(U_FAILURE(status)){
        log_data_err("failed to load data at p=%s t=%s n=%s, isAcceptable", path, type, name);
    }
    if(U_SUCCESS(status) ) {
        udata_close(result);
    }

    /* p is the context seen by isAcceptable(); 0 and 1 reject, 2 accepts. */
    for(p=0; p<=2; p++){
        status=U_ZERO_ERROR;
        result=udata_openChoice(path, type, name, isAcceptable, &p, &status);
        if(p<2) {
            if(status==U_INVALID_FORMAT_ERROR){
                log_verbose("Loads the data but rejects it as expected %s\n", myErrorName(status));
            }
            else {
                log_data_err("FAIL: failed to either load the data or to reject the loaded data. ERROR=%s\n", myErrorName(status) );
                if(U_SUCCESS(status)) {
                    /* Accepted although it should have been rejected. */
                    udata_close(result);
                }
            }
        }
        else {
            if(U_FAILURE(status)) {
                log_data_err("FAIL: failed to load the data and accept it. ERROR=%s\n", myErrorName(status) );
            }
            else {
                log_verbose("Loads the data and accepts it for p==2 as expected\n");
                udata_close(result);
            }
        }
    }
}
static void TestUDataGetInfo() {
UDataMemory *result;
/* UDataInfo cf. udata.h */
static UDataInfo dataInfo={
30, /*sizeof(UDataInfo),*/
0,
U_IS_BIG_ENDIAN,
U_CHARSET_FAMILY,
sizeof(UChar),
0,
{0x54, 0x65, 0x73, 0x74}, /* dataFormat="Test" */
{9, 0, 0, 0}, /* formatVersion */
{4, 0, 0, 0} /* dataVersion */
};
UErrorCode status=U_ZERO_ERROR;
const char* name="cnvalias";
const char* name2="test";
const char* type="icu";
const char* testPath=loadTestData(&status);
if(U_FAILURE(status)) {
log_data_err("Could not load testdata.dat, status = %s\n", u_errorName(status));
return;
}
log_verbose("Testing udata_getInfo() for cnvalias.icu\n");
result=udata_open(NULL, "icu", name, &status);
if(U_FAILURE(status)){
log_data_err("FAIL: udata_open() failed for path = NULL, name=%s, type=%s, \n errorcode=%s\n", name, type, myErrorName(status));
return;
}
udata_getInfo(result, &dataInfo);
if(dataInfo.size==20 && dataInfo.size!=30 &&
dataInfo.isBigEndian==U_IS_BIG_ENDIAN &&
dataInfo.charsetFamily==U_CHARSET_FAMILY &&
dataInfo.dataFormat[0]==0x43 && dataInfo.dataFormat[0]!=0x54 && /* dataFormat="CvAl" and not "Test". The values are set for cnvalias.dat*/
dataInfo.dataFormat[1]==0x76 && dataInfo.dataFormat[1]!=0x65 &&
dataInfo.dataFormat[2]==0x41 && dataInfo.dataFormat[2]!=0x73 &&
dataInfo.dataFormat[3]==0x6c && dataInfo.dataFormat[3]!=0x74 &&
dataInfo.formatVersion[0]!=9 && /*formatVersion is also set to the one for cnvalias*/
dataInfo.dataVersion[0]!=4 && /*dataVersion*/
dataInfo.dataVersion[1]!=0 ){
log_verbose("PASS: udata_getInfo() filled in the right values\n");
} else {
log_err("FAIL: udata_getInfo() filled in the wrong values\n");
}
udata_close(result);
log_verbose("Testing udata_getInfo() for test.icu\n");
result=udata_open(testPath, type, name2, &status);
if(U_FAILURE(status)) {
log_data_err("FAIL: udata_open() failed for path=%s name2=%s, type=%s, \n errorcode=%s\n", testPath, name2, type, myErrorName(status));
return;
}
udata_getInfo(result, &dataInfo);
if(dataInfo.size==20 &&
dataInfo.isBigEndian==U_IS_BIG_ENDIAN &&
dataInfo.charsetFamily==U_CHARSET_FAMILY &&
dataInfo.dataFormat[0]==0x54 && /* dataFormat="Test". The values are set for test.dat*/
dataInfo.dataFormat[1]==0x65 &&
dataInfo.dataFormat[2]==0x73 &&
dataInfo.dataFormat[3]==0x74 &&
dataInfo.formatVersion[0]==1 && /*formatVersion is also set to the one for test*/
dataInfo.dataVersion[0]==1 && /*dataVersion*/
dataInfo.dataVersion[1]==0 )
{
log_verbose("PASS: udata_getInfo() filled in the right values\n");
} else {
log_err("FAIL: udata_getInfo() filled in the wrong values\n");
}
udata_close(result);
}
/*
 * Verifies udata_getMemory() on two items:
 *   - cnvalias.icu: the second 32-bit word of the data must not be smaller
 *     than ucnv_countAvailable().
 *     NOTE(review): that word is presumably the converter count of the alias
 *     table -- confirm against the cnvalias.icu format description.
 *   - test.icu: the data must start with the 16-bit value 2000 followed by
 *     the string "YEAR".
 */
static void TestUDataGetMemory() {
    UDataMemory *result;
    const int32_t *table=NULL;
    uint16_t* intValue=0;
    UErrorCode status=U_ZERO_ERROR;
    const char* name="cnvalias";
    const char* type;
    const char* name2="test";
    const char* testPath = loadTestData(&status);
    if(U_FAILURE(status)) {
        log_data_err("Could not load testdata.dat, status = %s\n", u_errorName(status));
        return;
    }

    type="icu";
    log_verbose("Testing udata_getMemory() for \"cnvalias.icu\"\n");
    result=udata_openChoice(NULL, type, name, isAcceptable1, NULL, &status);
    if(U_FAILURE(status)){
        log_data_err("FAIL: udata_openChoice() failed for name=%s, type=%s, \n errorcode=%s\n", name, type, myErrorName(status));
        return;
    }
    table=(const int32_t *)udata_getMemory(result);
    /* The alias table may list more converters than what's actually available now. [grhoten] */
    if(ucnv_countAvailable() > table[1]) {
        /* Report the same word that was compared against. */
        log_err("FAIL: udata_getMemory() failed ucnv_countAvailable returned = %d, expected = %d\n", ucnv_countAvailable(), table[1]);
    }
    udata_close(result);

    type="icu";
    log_verbose("Testing udata_getMemory for \"test.icu\"()\n");
    result=udata_openChoice(testPath, type, name2, isAcceptable3, NULL, &status);
    if(U_FAILURE(status)){
        log_data_err("FAIL: udata_openChoice() failed for path=%s name=%s, type=%s, \n errorcode=%s\n", testPath, name2, type, myErrorName(status));
        return;
    }
    intValue=(uint16_t *)udata_getMemory(result);
    if( *intValue != 2000 || strcmp((char*)(intValue+1), "YEAR") != 0 ) {
        /* %s needs a char pointer, so cast just like the strcmp() above. */
        log_err("FAIL: udata_getMemory() failed: intValue :- Expected:2000 Got:%d \n\tstringValue:- Expected:YEAR Got:%s\n", *intValue, (const char*)(intValue+1));
    }
    udata_close(result);
}
/*
 * Checks how the udata API behaves when it is misused:
 *   - udata_open() / udata_openChoice() called with a failure status already
 *     set must return NULL,
 *   - udata_open() / udata_openChoice() with name == NULL must return NULL
 *     and set U_ILLEGAL_ARGUMENT_ERROR,
 *   - udata_getMemory(NULL) must return NULL,
 *   - udata_getInfo(NULL, ...) must set the size field of the info to 0,
 *   - udata_openChoice() for a non-existing item must return NULL and set
 *     U_FILE_ACCESS_ERROR.
 */
static void TestErrorConditions(){
    UDataMemory *result=NULL;
    UErrorCode status=U_ZERO_ERROR;
    uint16_t* intValue=0;
    /* Starts with a non-zero size so that the udata_getInfo(NULL) check below
     * can see the field being cleared. */
    static UDataInfo dataInfo={
        30, /*sizeof(UDataInfo),*/
        0,
        U_IS_BIG_ENDIAN,
        U_CHARSET_FAMILY,
        sizeof(UChar),
        0,
        {0x54, 0x65, 0x73, 0x74}, /* dataFormat="Test" */
        {9, 0, 0, 0}, /* formatVersion */
        {4, 0, 0, 0} /* dataVersion */
    };
    const char* name = "test";
    const char* type="icu";
    const char *testPath = loadTestData(&status);
    if(U_FAILURE(status)) {
        log_data_err("Could not load testdata.dat, status = %s\n", u_errorName(status));
        return;
    }

    status = U_ILLEGAL_ARGUMENT_ERROR;
    /*Try udata_open with status != U_ZERO_ERROR*/
    log_verbose("Testing udata_open() with status != U_ZERO_ERROR\n");
    result=udata_open(testPath, type, name, &status);
    if(result != NULL){
        log_data_err("FAIL: udata_open() is supposed to fail for path = %s, name=%s, type=%s, \n errorcode !=U_ZERO_ERROR\n", testPath, name, type);
        udata_close(result);
    } else {
        log_verbose("PASS: udata_open with errorCode != U_ZERO_ERROR failed as expected\n");
    }

    /*Try udata_open with data name=NULL*/
    log_verbose("Testing udata_open() with data name=NULL\n");
    status=U_ZERO_ERROR;
    result=udata_open(testPath, type, NULL, &status);
    if(U_FAILURE(status)){
        if(status != U_ILLEGAL_ARGUMENT_ERROR || result != NULL){
            log_err("FAIL: udata_open() with name=NULL should return NULL and errocode U_ILLEGAL_ARGUMENT_ERROR, GOT: errorcode=%s\n", myErrorName(status));
        }else{
            log_verbose("PASS: udata_open with name=NULL failed as expected and errorcode = %s as expected\n", myErrorName(status));
        }
    }else{
        log_err("FAIL: udata_open() with data name=NULL is supposed to fail for path = %s, name=NULL type=%s errorcode=U_ZERO_ERROR \n", testPath, type);
        udata_close(result);
    }

    /*Try udata_openChoice with status != U_ZERO_ERROR*/
    log_verbose("Testing udata_openChoice() with status != U_ZERO_ERROR\n");
    status=U_ILLEGAL_ARGUMENT_ERROR;
    result=udata_openChoice(testPath, type, name, isAcceptable3, NULL, &status);
    if(result != NULL){
        log_err("FAIL: udata_openChoice() is supposed to fail for path = %s, name=%s, type=%s, \n errorcode != U_ZERO_ERROR\n", testPath, name, type);
        udata_close(result);
    } else {
        log_verbose("PASS: udata_openChoice() with errorCode != U_ZERO_ERROR failed as expected\n");
    }

    /*Try udata_openChoice with data name=NULL*/
    log_verbose("Testing udata_openChoice() with data name=NULL\n");
    status=U_ZERO_ERROR;
    result=udata_openChoice(testPath, type, NULL, isAcceptable3, NULL, &status);
    if(U_FAILURE(status)){
        if(status != U_ILLEGAL_ARGUMENT_ERROR || result != NULL){
            log_err("FAIL: udata_openChoice() with name=NULL should return NULL and errocode U_ILLEGAL_ARGUMENT_ERROR, GOT: errorcode=%s\n", myErrorName(status));
        }else{
            log_verbose("PASS: udata_openChoice with name=NULL failed as expected and errorcode = %s as expected\n", myErrorName(status));
        }
    }else{
        log_err("FAIL: udata_openChoice() with data name=NULL is supposed to fail for path = %s, name=NULL type=%s errorcode=U_ZERO_ERROR \n", testPath, type);
        udata_close(result);
    }

    /*Try udata_getMemory with UDataMemory=NULL*/
    log_verbose("Testing udata_getMemory with UDataMemory=NULL\n");
    intValue=(uint16_t*)udata_getMemory(NULL);
    if(intValue != NULL){
        log_err("FAIL: udata_getMemory with UDataMemory = NULL is supposed to fail\n");
    }

    /*Try udata_getInfo with UDataMemory=NULL*/
    status=U_ZERO_ERROR;
    udata_getInfo(NULL, &dataInfo);
    if(dataInfo.size != 0){
        log_err("FAIL : udata_getInfo with UDataMemory = NULL us supposed to fail\n");
    }

    /*Try udata_openChoice with a non existing binary file*/
    log_verbose("Testing udata_openChoice() with a non existing binary file\n");
    result=udata_openChoice(testPath, "tst", "nonexist", isAcceptable3, NULL, &status);
    if(status==U_FILE_ACCESS_ERROR){
        log_verbose("Opening udata_openChoice with non-existing file handled correctly.\n");
        status=U_ZERO_ERROR;
    } else {
        log_err("calling udata_open with non-existing file not handled correctly\n. Expected: U_FILE_ACCESS_ERROR, Got: %s\n", myErrorName(status));
    }
    if(result != NULL){
        log_err("calling udata_open with non-existing file didn't return a null value\n");
        /* Close only after the NULL check so a released pointer is never inspected. */
        udata_close(result);
    } else {
        log_verbose("calling udat_open with non-existing file returned null as expected\n");
    }
}
/* Test whether apps and ICU can each have their own root.res */
static void TestAppData()
{
UResourceBundle *icu, *app;
UResourceBundle *tmp = NULL;
UResourceBundle *tmp2 = NULL;
const UChar *appString;
const UChar *icuString;
int32_t len;
UErrorCode status = U_ZERO_ERROR;
char testMsgBuf[256];
const char* testPath=loadTestData(&status);
if(U_FAILURE(status)) {
log_data_err("Could not load testdata.dat, status = %s\n", u_errorName(status));
return;
}
icu = ures_open(NULL, "root", &status);
if(U_FAILURE(status))
{
log_data_err("%s:%d: Couldn't open root ICU bundle- %s", __FILE__, __LINE__, u_errorName(status));
return;
}
/* log_info("Open icu root: %s size_%d\n", u_errorName(status), ures_getSize(icu)); */
status = U_ZERO_ERROR;
app = ures_open(testPath, "root", &status);
if(U_FAILURE(status))
{
log_data_err("%s:%d: Couldn't open app ICU bundle [%s]- %s", __FILE__, __LINE__, testPath, u_errorName(status));
return;
}
/* log_info("Open app: %s, size %d\n", u_errorName(status), ures_getSize(app)); */
tmp = ures_getByKey(icu, "Version", tmp, &status);
if(U_FAILURE(status))
{
log_err("%s:%d: Couldn't get Version string from ICU root bundle- %s", __FILE__, __LINE__, u_errorName(status));
return;
}
icuString = ures_getString(tmp, &len, &status);
if(U_FAILURE(status))
{
log_err("%s:%d: Couldn't get string from Version string from ICU root bundle- %s", __FILE__, __LINE__, u_errorName(status));
return;
}
/* log_info("icuString=%p - %s\n", icuString, austrdup(icuString)); */
tmp2 = ures_getByKey(app, "Version", tmp2, &status);
if(U_FAILURE(status))
{
log_err("%s:%d: Couldn't get Version string from App root bundle- %s", __FILE__, __LINE__, u_errorName(status));
return;
}
appString = ures_getString(tmp2, &len, &status);
if(U_FAILURE(status))
{
log_err("%s:%d: Couldn't get string from Version string from App root bundle- %s", __FILE__, __LINE__, u_errorName(status));
return;
}
/* log_info("appString=%p - %s\n", appString, austrdup(appString)); */
if(!u_strcmp(icuString, appString))
{
log_err("%s:%d: Error! Expected ICU and App root version strings to be DIFFERENT but they are both %s and %s\n", __FILE__, __LINE__, austrdup(icuString),
austrdup(appString));
}
else
{
log_verbose("%s:%d: appstr=%s, icustr=%s\n", __FILE__,
__LINE__, u_austrcpy(testMsgBuf, appString), u_austrcpy(testMsgBuf, icuString));
}
ures_close(tmp);
ures_close(tmp2);
ures_close(icu);
ures_close(app);
}
#endif
/*
 * Verify that U_ICUDATA_NAME has the form "icudt" + <major version> + <type>,
 * where <type> is 'b' (ASCII, big-endian), 'l' (ASCII, little-endian) or
 * 'e' (EBCDIC). If the build system also defines ICUDATA_NAME, check that it
 * matches U_ICUDATA_NAME.
 */
static void TestICUDataName()
{
    UVersionInfo icuVersion;
    /* "icudt" (5) + at most 3 digits for a uint8_t major version + type + NUL fits easily */
    char expectDataName[20];
    /* "icudt" + two-digit major version + one type character */
    const size_t expectLen = 8;

    char typeChar = '?';

    /* Print out the version # we have .. */
    log_verbose("utypes.h says U_ICUDATA_NAME = %s\n", U_ICUDATA_NAME);

    /* Build up the version # we expect to get */
    u_getVersion(icuVersion);

    switch(U_CHARSET_FAMILY)
    {
    case U_ASCII_FAMILY:
        switch((int)U_IS_BIG_ENDIAN)
        {
        case 1:
            typeChar = 'b';
            break;
        case 0:
            typeChar = 'l';
            break;
        default:
            log_err("Expected 1 or 0 for U_IS_BIG_ENDIAN, got %d!\n", (int)U_IS_BIG_ENDIAN);
            /* return; */
        }
        break;
    case U_EBCDIC_FAMILY:
        typeChar = 'e';
        break;
    default:
        /* unknown charset family: typeChar stays '?' and the name comparison below reports it */
        break;
    }

    /* Only major number is needed. */
    sprintf(expectDataName, "%s%d%c",
                "icudt",
                (int)icuVersion[0],
                typeChar);

    log_verbose("Expected: %s\n", expectDataName);

    /* lengths are size_t; cast for the %d conversions used in the messages */
    if(uprv_strlen(expectDataName) != expectLen)
    {
        log_err("*Expected* length is wrong (test err?), should be %d is %d\n",
            (int)expectLen, (int)uprv_strlen(expectDataName));
    }

    if(uprv_strlen(U_ICUDATA_NAME) != expectLen)
    {
        log_err("U_ICUDATA_NAME length should be %d is %d\n",
            (int)expectLen, (int)uprv_strlen(U_ICUDATA_NAME));
    }

    if(uprv_strcmp(U_ICUDATA_NAME, expectDataName))
    {
        log_err("U_ICUDATA_NAME should be %s but is %s\n",
                expectDataName, U_ICUDATA_NAME);
    }

        /* ICUDATA_NAME comes from the build system on *nix */
#ifdef ICUDATA_NAME
    if(uprv_strcmp(U_ICUDATA_NAME, ICUDATA_NAME))
    {
        log_err("ICUDATA_NAME  and U_ICUDATA_NAME don't match: "
            "ICUDATA_NAME=%s, U_ICUDATA_NAME=%s.  Check configure.in, icudefs.mk.in, utypes.h...\n",  ICUDATA_NAME, U_ICUDATA_NAME);
    }
    else
    {
        log_verbose("ICUDATA_NAME=%s (from icudefs.mk), U_ICUDATA_NAME=%s (from utypes.h)\n", ICUDATA_NAME, U_ICUDATA_NAME);
    }
#endif

}
/* test data swapping ------------------------------------------------------- */
/*
 * gOffsetTOCAppDataItem1: a minimal, hand-built data item (header only) with
 * data format "1111". It is referenced twice from the pointer table of
 * contents in gOffsetTOCAppData_dat and opened by PointerTableOfContents().
 * The leading double only forces alignment of the bytes that follow.
 * Two spellings exist: a byte-string form for OS/400 and a struct form
 * for all other platforms.
 */
#if U_PLATFORM == U_PF_OS400
/* See comments in genccode.c on when this special implementation can be removed. */
static const struct {
double bogus;
const char *bytes;
} gOffsetTOCAppDataItem1={ 0.0, /* alignment bytes */
"\x00\x14" /* sizeof(UDataInfo) *//* MappedData { */
"\xda"
"\x27" /* } */
"\x00\x14" /* sizeof(UDataInfo) *//* UDataInfo { */
"\0\0"
"\1" /* U_IS_BIG_ENDIAN */
"\1" /* U_CHARSET_FAMILY */
"\2" /* sizeof(UChar) */
"\0"
"\x31\x31\x31\x31"
"\0\0\0\0"
"\0\0\0\0" /* } */
};
#else
static const struct {
double bogus;
MappedData bytes1;
UDataInfo bytes2;
uint8_t bytes3; /* no initializer below, so this member is zero */
} gOffsetTOCAppDataItem1={
0.0, /* alignment bytes */
{ sizeof(UDataInfo), 0xda, 0x27 }, /* MappedData */
{sizeof(UDataInfo),
0,
U_IS_BIG_ENDIAN,
U_CHARSET_FAMILY,
sizeof(UChar),
0,
{0x31, 0x31, 0x31, 0x31}, /* dataFormat="1111" */
{0, 0, 0, 0}, /* formatVersion */
{0, 0, 0, 0}} /* dataVersion */
};
#endif
/*
 * Deliberately invalid "data item": 25 UChars of plain text with no ICU data
 * header and no terminating NUL. It is listed in the gOffsetTOCAppData_dat
 * table of contents so that PointerTableOfContents() can check that opening
 * it fails.
 */
static const UChar gOffsetTOCGarbage[] = { /* "I have been very naughty!" */
0x49, 0x20, 0x68, 0x61, 0x76, 0x65, 0x20, 0x62, 0x65, 0x65, 0x6E,
0x20, 0x76, 0x65, 0x72, 0x79, 0x20, 0x6E, 0x61, 0x75, 0x67, 0x68, 0x74, 0x79, 0x21
};
/* Original source: icu/source/tools/genccode */
/*
 * Hand-built common data package that uses a pointer table of contents
 * (data format "ToCP"): each TOC entry is a name plus a pointer to the item.
 * It is registered by PointerTableOfContents() via udata_setAppData() under
 * the package name "OffsetTOCAppData", and passed to udata_setCommonData()
 * and swapFn() elsewhere in this file as input that must be rejected
 * or ignored.
 */
static const struct {
uint16_t headerSize;
uint8_t magic1, magic2;
UDataInfo info;
char padding[8];
uint32_t count, reserved;
const struct {
const char *const name;
const void *const data;
} toc[3];
} gOffsetTOCAppData_dat = {
32, /* headerSize */ /* presumably 2+1+1 + sizeof(UDataInfo) + 8 bytes of padding -- TODO confirm */
0xda, /* magic1, (see struct MappedData in udata.c) */
0x27, /* magic2 */
{ /*UDataInfo */
sizeof(UDataInfo), /* size */
0, /* reserved */
U_IS_BIG_ENDIAN,
U_CHARSET_FAMILY,
sizeof(UChar),
0, /* reserved */
{ /* data format identifier */
0x54, 0x6f, 0x43, 0x50}, /* "ToCP" */
{1, 0, 0, 0}, /* format version major, minor, milli, micro */
{0, 0, 0, 0} /* dataVersion */
},
{0,0,0,0,0,0,0,0}, /* Padding[8] */
3, /* count */
0, /* Reserved */
{ /* TOC structure */
/* the first two names refer to the same item; the third points at non-data */
{ "OffsetTOCAppData/a/b", &gOffsetTOCAppDataItem1 },
{ "OffsetTOCAppData/gOffsetTOCAppDataItem1", &gOffsetTOCAppDataItem1 },
{ "OffsetTOCAppData/gOffsetTOCGarbage", &gOffsetTOCGarbage }
}
};
/* Unfortunately, dictionaries are in a C++ header */
/*
 * The prototype is therefore repeated here by hand so that this C file can
 * reference udict_swap in the swapCases table (for the "dict" type).
 */
U_CAPI int32_t U_EXPORT2
udict_swap(const UDataSwapper *ds, const void *inData, int32_t length, void *outData, UErrorCode *pErrorCode);
/* test cases for maximum data swapping code coverage */
/*
 * Each entry names a data item (name + type) and the swap function that
 * TestSwapData() runs on it. How TestSwapData() picks the package:
 *  - a name starting with '*' is loaded from the test data package
 *    (the '*' itself is stripped before opening);
 *  - types "brk" and "dict" are loaded from U_ICUDATA_BRKITR;
 *  - names "ucadata" and "invuca" are loaded from U_ICUDATA_COLL;
 *  - everything else is opened with a NULL package.
 * Entries are compiled in or out according to the UCONFIG_* switches.
 */
static const struct {
const char *name, *type;
UDataSwapFn *swapFn;
} swapCases[]={
/* resource bundles */
/* resource bundle with many data types */
{"*testtypes", "res", ures_swap},
/* resource bundle with collation data */
{"ja", "res", ures_swap},
/* resource bundle with options-only collation data */
{"ru", "res", ures_swap},
{"el", "res", ures_swap},
/* ICU's root */
{"root", "res", ures_swap},
/* Test a 32-bit key table. This is large. */
{"*testtable32", "res", ures_swap},
/* ICU 4.2 resource bundle - data format 1.2 (little-endian ASCII) */
{"*old_l_testtypes", "res", ures_swap},
/* same for big-endian EBCDIC */
{"*old_e_testtypes", "res", ures_swap},
#if !UCONFIG_NO_COLLATION
/* standalone collation data files */
{"ucadata", "icu", ucol_swap},
#if 0
/* Starting with ICU 53, the "inverse UCA" data is integrated into ucadata.icu. */
{"invuca", "icu", ucol_swapInverseUCA},
#endif
#endif
#if !UCONFIG_NO_LEGACY_CONVERSION
/* conversion table files */
/* SBCS conversion table file without extension */
{"ibm-913_P100-2000", "cnv", ucnv_swap},
/* EBCDIC_STATEFUL conversion table file with extension */
{"ibm-1390_P110-2003", "cnv", ucnv_swap},
/* DBCS extension-only conversion table file */
{"ibm-16684_P110-2003", "cnv", ucnv_swap},
/* EUC-TW (3-byte) conversion table file without extension */
{"ibm-964_P110-1999", "cnv", ucnv_swap},
/* GB 18030 (4-byte) conversion table file without extension */
{"gb18030", "cnv", ucnv_swap},
/* MBCS conversion table file with extension */
{"*test4x", "cnv", ucnv_swap},
/*
* MBCS conversion table file without extension,
* to test swapping and preflighting of UTF-8-friendly mbcsIndex[].
*/
{"jisx-212", "cnv", ucnv_swap},
#endif
#if !UCONFIG_NO_CONVERSION
/* alias table */
{"cnvalias", "icu", ucnv_swapAliases},
#endif
#if !UCONFIG_NO_IDNA
{"rfc3491", "spp", usprep_swap},
#endif
#if !UCONFIG_NO_BREAK_ITERATION
{"char", "brk", ubrk_swap},
{"thaidict", "dict",udict_swap},
#endif
#if 0
/*
* Starting with ICU 4.8, the Unicode property (value) aliases data
* is hardcoded in the ICU4C common library.
* The swapper was moved to the toolutil library for swapping for ICU4J.
*/
/* Unicode properties */
{"pnames", "icu", upname_swap},
#endif
#if 0
/*
* Starting with ICU4C 3.4, the core Unicode properties files
* (uprops.icu, ucase.icu, ubidi.icu, unorm.icu)
* are hardcoded in the common DLL and therefore not included
* in the data package any more.
* Their swapping code is moved from the common DLL to the icuswap tool so that
* we need not jump through hoops (like adding snapshots of these files
* to testdata) for code coverage in tests.
* See Jitterbug 4497.
*
* ICU4C 4.4 adds normalization data files again, e.g., nfkc.nrm.
*/
{"uprops", "icu", uprops_swap},
{"ucase", "icu", ucase_swap},
{"ubidi", "icu", ubidi_swap},
#endif
#if !UCONFIG_NO_NORMALIZATION && !UCONFIG_ONLY_COLLATION
{"nfkc", "nrm", unorm2_swap},
#if !UCONFIG_NO_REGULAR_EXPRESSIONS
{"confusables", "cfu", uspoof_swap}, /* spoof data missing without regex */
#endif
#endif
{"unames", "icu", uchar_swapNames}
/* the last item should not be #if'ed so that it can reliably omit the last comma */
};
/* Large enough for the largest swappable data item. */
/*
 * Size in bytes of ONE swap buffer. TestSwapData() allocates
 * 2*SWAP_BUFFER_SIZE bytes and hands the two halves to TestSwapCase().
 */
#define SWAP_BUFFER_SIZE 1800000
/*
 * printError callback installed on the UDataSwapper by TestSwapCase().
 * Forwards the swapper's message to the informational log with a "[swap] "
 * prefix, then logs an (otherwise empty) error line so that the test
 * framework counts a failure.
 *
 * context is not used; fmt/args are the printf-style message.
 */
static void U_CALLCONV
printError(void *context, const char *fmt, va_list args) {
    (void)context; /* callback signature requires it; nothing to do with it here */

    vlog_info("[swap] ", fmt, args);
    log_err("\n"); /* Register error */
}
/*
 * Exercise one swap function on one opened data item.
 *
 * Steps:
 *  1. check that swapFn leaves an incoming failure code alone and rejects
 *     NULL arguments;
 *  2. check that swapFn rejects data of a foreign format (gOffsetTOCAppData_dat);
 *  3. preflight, then swap the item to the opposite endianness (into buffer),
 *     swap it in place to the opposite charset family, and swap it back to
 *     the original endianness/charset (into buffer2);
 *  4. compare the round-tripped bytes with the original and, on mismatch,
 *     dump the first differing bytes.
 *
 * pData    the opened data item
 * name     item name, used only in log messages
 * swapFn   the swap implementation under test
 * buffer   first work buffer
 * buffer2  second work buffer
 *
 * The visible caller, TestSwapData(), passes two buffers of SWAP_BUFFER_SIZE
 * bytes each; the preflighted length is checked against that size before
 * anything is written.
 */
static void
TestSwapCase(UDataMemory *pData, const char *name,
             UDataSwapFn *swapFn,
             uint8_t *buffer, uint8_t *buffer2) {
    UDataSwapper *ds;
    const void *inData, *inHeader;
    int32_t length, dataLength, length2, headerLength;

    UErrorCode errorCode;
    UErrorCode badStatus;

    UBool inEndian, oppositeEndian;
    uint8_t inCharset, oppositeCharset;

    /* First we check that swapFn handles failures as expected. */
    errorCode = U_UNSUPPORTED_ERROR;
    length = swapFn(NULL, NULL, 0, buffer, &errorCode);
    if (length != 0 || errorCode != U_UNSUPPORTED_ERROR) {
        log_err("%s() did not fail as expected - %s\n", name, u_errorName(errorCode));
    }
    errorCode = U_ZERO_ERROR;
    length = swapFn(NULL, NULL, 0, buffer, &errorCode);
    if (length != 0 || errorCode != U_ILLEGAL_ARGUMENT_ERROR) {
        log_err("%s() did not fail as expected with bad arguments - %s\n", name, u_errorName(errorCode));
    }


    /* Continue with the rest of the tests. */
    errorCode = U_ZERO_ERROR;
    inData=udata_getMemory(pData);

    /*
     * get the data length if possible, to verify that swapping and preflighting
     * handles the entire data
     */
    dataLength=udata_getLength(pData);

    /*
     * get the header and its length
     * all of the swap implementation functions require the header to be included
     */
    inHeader=udata_getRawMemory(pData);
    headerLength=(int32_t)((const char *)inData-(const char *)inHeader);

    /* first swap to opposite endianness but same charset family */
    errorCode=U_ZERO_ERROR;
    ds=udata_openSwapperForInputData(inHeader, headerLength,
            !U_IS_BIG_ENDIAN, U_CHARSET_FAMILY, &errorCode);
    if(U_FAILURE(errorCode)) {
        log_err("udata_openSwapperForInputData(%s->!isBig+same charset) failed - %s\n",
                name, u_errorName(errorCode));
        return;
    }

    inEndian=ds->inIsBigEndian;
    inCharset=ds->inCharset;

    oppositeEndian=!inEndian;
    oppositeCharset= inCharset==U_ASCII_FAMILY ? U_EBCDIC_FAMILY : U_ASCII_FAMILY;

    /* make this test work with data files that are built for a different platform */
    if(inEndian!=U_IS_BIG_ENDIAN || inCharset!=U_CHARSET_FAMILY) {
        udata_closeSwapper(ds);
        ds=udata_openSwapper(inEndian, inCharset, oppositeEndian, inCharset, &errorCode);
        if(U_FAILURE(errorCode)) {
            log_err("udata_openSwapper(%s->!isBig+same charset) failed - %s\n",
                    name, u_errorName(errorCode));
            return;
        }
    }

    /*
    Check error checking of swappable data not specific to this swapper.
    This should always fail.
    */
    badStatus = U_ZERO_ERROR;
    length=swapFn(ds, &gOffsetTOCAppData_dat, -1, NULL, &badStatus);
    if(badStatus != U_UNSUPPORTED_ERROR) {
        /* report the status of THIS call, not the unrelated errorCode */
        log_err("swapFn(%s->!isBig+same charset) unexpectedly succeeded on bad data - %s\n",
                name, u_errorName(badStatus));
        udata_closeSwapper(ds);
        return;
    }

    /* Now allow errors to be printed */
    ds->printError=printError;

    /* preflight the length */
    length=swapFn(ds, inHeader, -1, NULL, &errorCode);
    if(U_FAILURE(errorCode)) {
        log_err("swapFn(preflight %s->!isBig+same charset) failed - %s\n",
                name, u_errorName(errorCode));
        udata_closeSwapper(ds);
        return;
    }

    /* compare the preflighted length against the data length */
    if(dataLength>=0 && (length+15)<(headerLength+dataLength)) {
        log_err("swapFn(preflight %s->!isBig+same charset) length too small: %d < data length %d\n",
                name, length, (headerLength+dataLength));
        udata_closeSwapper(ds);
        return;
    }

    /* never write more than one swap buffer can hold */
    if(length>SWAP_BUFFER_SIZE) {
        log_err("swapFn(preflight %s->!isBig+same charset) length %d exceeds SWAP_BUFFER_SIZE %d\n",
                name, length, (int)SWAP_BUFFER_SIZE);
        udata_closeSwapper(ds);
        return;
    }

    /* swap, not in-place */
    length2=swapFn(ds, inHeader, length, buffer, &errorCode);
    udata_closeSwapper(ds);
    if(U_FAILURE(errorCode)) {
        log_err("swapFn(%s->!isBig+same charset) failed - %s\n",
                name, u_errorName(errorCode));
        return;
    }

    /* compare the swap length against the preflighted length */
    if(length2!=length) {
        log_err("swapFn(%s->!isBig+same charset) length differs from preflighting: %d != preflighted %d\n",
                name, length2, length);
        return;
    }

    /* next swap to opposite charset family */
    ds=udata_openSwapper(oppositeEndian, inCharset,
                         oppositeEndian, oppositeCharset,
                         &errorCode);
    if(U_FAILURE(errorCode)) {
        log_err("udata_openSwapper(%s->!isBig+other charset) failed - %s\n",
                name, u_errorName(errorCode));
        return;
    }
    ds->printError=printError;

    /* swap in-place */
    length2=swapFn(ds, buffer, length, buffer, &errorCode);
    udata_closeSwapper(ds);
    if(U_FAILURE(errorCode)) {
        log_err("swapFn(%s->!isBig+other charset) failed - %s\n",
                name, u_errorName(errorCode));
        return;
    }

    /* compare the swap length against the original length */
    if(length2!=length) {
        log_err("swapFn(%s->!isBig+other charset) length differs from original: %d != original %d\n",
                name, length2, length);
        return;
    }

    /* finally swap to original platform values */
    ds=udata_openSwapper(oppositeEndian, oppositeCharset,
                         inEndian, inCharset,
                         &errorCode);
    if(U_FAILURE(errorCode)) {
        log_err("udata_openSwapper(%s->back to original) failed - %s\n",
                name, u_errorName(errorCode));
        return;
    }
    ds->printError=printError;

    /* swap, not in-place */
    length2=swapFn(ds, buffer, length, buffer2, &errorCode);
    udata_closeSwapper(ds);
    if(U_FAILURE(errorCode)) {
        log_err("swapFn(%s->back to original) failed - %s\n",
                name, u_errorName(errorCode));
        return;
    }

    /* compare the swap length against the original length */
    if(length2!=length) {
        log_err("swapFn(%s->back to original) length differs from original: %d != original %d\n",
                name, length2, length);
        return;
    }

    /* compare the final contents with the original */
    if(0!=uprv_memcmp(inHeader, buffer2, length)) {
        const uint8_t *original;
        uint8_t diff[8];
        int32_t i, j;

        log_err("swapFn(%s->back to original) contents differs from original\n",
                name);

        /* find the first difference */
        original=(const uint8_t *)inHeader;
        for(i=0; i<length && original[i]==buffer2[i]; ++i) {}

        /* find the next byte that is the same */
        for(j=i+1; j<length && original[j]!=buffer2[j]; ++j) {}
        log_info("    difference at index %d=0x%x, until index %d=0x%x\n", i, i, j, j);

        /* round down to the last 4-boundary for better result output */
        i&=~3;
        log_info("showing bytes from index %d=0x%x (length %d=0x%x):\n", i, i, length, length);

        /* print 8 bytes but limit to the buffer contents */
        length2=i+(int32_t)sizeof(diff);
        if(length2>length) {
            length2=length;
        }

        /* print the original bytes */
        uprv_memset(diff, 0, sizeof(diff));
        for(j=i; j<length2; ++j) {
            diff[j-i]=original[j];
        }
        log_info("    original: %02x %02x %02x %02x %02x %02x %02x %02x\n",
            diff[0], diff[1], diff[2], diff[3], diff[4], diff[5], diff[6], diff[7]);

        /* print the swapped bytes */
        uprv_memset(diff, 0, sizeof(diff));
        for(j=i; j<length2; ++j) {
            diff[j-i]=buffer2[j];
        }
        log_info("    swapped:  %02x %02x %02x %02x %02x %02x %02x %02x\n",
            diff[0], diff[1], diff[2], diff[3], diff[4], diff[5], diff[6], diff[7]);
    }
}
/*
 * printError callback that formats the swapper's message into a caller-owned
 * character buffer instead of logging it.
 *
 * context must point to a writable char buffer; the message is written with
 * vsprintf(), i.e. without any bounds check, so the buffer has to be large
 * enough for the formatted text plus the terminating NUL.
 */
static void U_CALLCONV
printErrorToString(void *context, const char *fmt, va_list args) {
    char *destination = (char *)context;

    vsprintf(destination, fmt, args);
}
#if !UCONFIG_NO_FILE_IO && !UCONFIG_NO_LEGACY_CONVERSION
/*
 * Driver for the data swapping tests.
 *
 * First checks the argument/error handling of udata_openSwapper(),
 * udata_printError(), udata_openSwapperForInputData() and (with collation)
 * ucol_swap(); then opens every item listed in swapCases and runs
 * TestSwapCase() on it.
 *
 * A single heap block of 2*SWAP_BUFFER_SIZE bytes is allocated and split into
 * the two work buffers that TestSwapCase() needs.
 */
static void
TestSwapData() {
    char name[100];
    UDataSwapper *ds;
    UDataMemory *pData;
    uint8_t *buffer;
    const char *pkg, *nm, *testPath;
    UErrorCode errorCode = U_ZERO_ERROR;
    int32_t i;

    buffer=(uint8_t *)malloc(2*SWAP_BUFFER_SIZE);
    if(buffer==NULL) {
        log_err("unable to allocate %d bytes\n", 2*SWAP_BUFFER_SIZE);
        return;
    }

    testPath=loadTestData(&errorCode);
    if(U_FAILURE(errorCode)) {
        /* keep going: items that do not live in testdata can still be tested */
        log_data_err("Could not load testdata.dat, status = %s\n", u_errorName(errorCode));
    }

    /* Test that printError works as expected. */
    errorCode=U_USELESS_COLLATOR_ERROR;
    ds=udata_openSwapper(U_IS_BIG_ENDIAN, U_ASCII_FAMILY,
                         !U_IS_BIG_ENDIAN, U_ASCII_FAMILY,
                         &errorCode);
    if (ds != NULL || errorCode != U_USELESS_COLLATOR_ERROR) {
        log_err("udata_openSwapper should have returned NULL with bad argument\n");
    }
    errorCode=U_ZERO_ERROR;
    ds=udata_openSwapper(U_IS_BIG_ENDIAN, U_ASCII_FAMILY,
                         !U_IS_BIG_ENDIAN, U_ASCII_FAMILY,
                         &errorCode);
    if (U_FAILURE(errorCode) || ds == NULL) {
        /* do not dereference a swapper that could not be opened */
        log_err("udata_openSwapper failed - %s\n", u_errorName(errorCode));
    } else {
        /* start from an empty string so the comparison below is well defined
           even if the callback is never invoked */
        name[0]=0;
        ds->printError=printErrorToString;
        ds->printErrorContext=name;
        udata_printError(ds, "This %s a %s", "is", "test");
        udata_closeSwapper(ds);
        if (strcmp(name, "This is a test") != 0) {
            log_err("udata_printError can't properly print error messages. Got = %s\n", name);
        }
    }
    errorCode = U_USELESS_COLLATOR_ERROR;
    ds=udata_openSwapperForInputData(NULL, 0,
                         !U_IS_BIG_ENDIAN, U_ASCII_FAMILY,
                         &errorCode);
    if (ds != NULL || errorCode != U_USELESS_COLLATOR_ERROR) {
        log_err("udata_openSwapperForInputData should have returned NULL with bad argument\n");
    }
    errorCode=U_ZERO_ERROR;
    ds=udata_openSwapperForInputData(NULL, 0,
                         !U_IS_BIG_ENDIAN, U_ASCII_FAMILY,
                         &errorCode);
    if (ds != NULL || errorCode != U_ILLEGAL_ARGUMENT_ERROR) {
        log_err("udata_openSwapperForInputData should have returned NULL with bad argument\n");
    }
    errorCode=U_ZERO_ERROR;
    /* clear the whole buffer; sizeof(2*SWAP_BUFFER_SIZE) would only be sizeof(int) */
    memset(buffer, 0, 2*SWAP_BUFFER_SIZE);
    ds=udata_openSwapperForInputData(buffer, 2*SWAP_BUFFER_SIZE,
                         !U_IS_BIG_ENDIAN, U_ASCII_FAMILY,
                         &errorCode);
    if (ds != NULL || errorCode != U_UNSUPPORTED_ERROR) {
        log_err("udata_openSwapperForInputData should have returned NULL with bad argument\n");
    }
    errorCode=U_ZERO_ERROR;

    /* Test argument checking. ucol_swap is normally tested via ures_swap, and isn't normally called directly. */
#if !UCONFIG_NO_COLLATION
    ucol_swap(NULL, NULL, -1, NULL, &errorCode);
    if (errorCode != U_ILLEGAL_ARGUMENT_ERROR) {
        log_err("ucol_swap did not fail as expected\n");
    }
    errorCode=U_ZERO_ERROR;
#endif

    for(i=0; i<UPRV_LENGTHOF(swapCases); ++i) {
        /* build the name for logging */
        errorCode=U_ZERO_ERROR;
        if(swapCases[i].name[0]=='*') {
            pkg=testPath;
            nm=swapCases[i].name+1;
            uprv_strcpy(name, "testdata");
        } else if (uprv_strcmp(swapCases[i].type, "brk")==0
            || uprv_strcmp(swapCases[i].type, "dict")==0) {
            pkg=U_ICUDATA_BRKITR;
            nm=swapCases[i].name;
            uprv_strcpy(name, U_ICUDATA_BRKITR);
#if !UCONFIG_NO_COLLATION
        } else if (uprv_strcmp(swapCases[i].name, "ucadata")==0
            || uprv_strcmp(swapCases[i].name, "invuca")==0) {
            pkg=U_ICUDATA_COLL;
            nm=swapCases[i].name;
            uprv_strcpy(name, U_ICUDATA_COLL);
#endif  /* !UCONFIG_NO_COLLATION */
        } else {
            pkg=NULL;
            nm=swapCases[i].name;
            uprv_strcpy(name, "NULL");
        }
        uprv_strcat(name, "/");
        uprv_strcat(name, nm);
        uprv_strcat(name, ".");
        uprv_strcat(name, swapCases[i].type);

        pData=udata_open(pkg, swapCases[i].type, nm, &errorCode);

        if(U_SUCCESS(errorCode)) {
            /* first half / second half of the allocation are the two work buffers */
            TestSwapCase(pData, name, swapCases[i].swapFn, buffer, buffer+SWAP_BUFFER_SIZE);
            udata_close(pData);
        } else {
            log_data_err("udata_open(%s) failed - %s\n",
                name, u_errorName(errorCode));
        }
    }

    free(buffer);
}
#endif
/*
 * Test application data that uses a pointer table of contents.
 *
 * Registers the hand-built gOffsetTOCAppData_dat package under the name
 * "OffsetTOCAppData", then checks that
 *  - the valid item can be opened both directly and through the tree "a",
 *  - the garbage item is rejected,
 *  - a name that is not in the table of contents is not found.
 *
 * The status is reset before every udata_open() call so that each lookup is
 * really attempted, even after a previous one failed.
 */
static void PointerTableOfContents() {
    UDataMemory      *dataItem;
    UErrorCode        status=U_ZERO_ERROR;

    /* register the in-memory package image as application data */
    status=U_ZERO_ERROR;
    udata_setAppData("OffsetTOCAppData", &gOffsetTOCAppData_dat, &status);
    if (status != U_ZERO_ERROR) {
        log_err("FAIL: PointerTableOfContents(): udata_setAppData(\"OffsetTOCAppData\", &gOffsetTOCAppData_dat, status) \n"
                " returned status of %s\n", u_errorName(status));
        return;
    }

    dataItem = udata_open("OffsetTOCAppData", "", "gOffsetTOCAppDataItem1", &status);
    if (U_FAILURE(status)) {
        log_err("FAIL: gOffsetTOCAppDataItem1 could not be opened. status = %s\n", u_errorName(status));
    }
    if (udata_getMemory(dataItem) != NULL) {
        log_verbose("PASS: udata_getMemory(dataItem) passed\n");
    }
    else {
        log_err("FAIL: udata_getMemory returned NULL\n");
    }
    udata_close(dataItem);

    status = U_ZERO_ERROR;
    dataItem = udata_open("OffsetTOCAppData-a", "", "b", &status);
    if (U_FAILURE(status)) {
        log_err("FAIL: gOffsetTOCAppDataItem1 in tree \"a\" could not be opened. status = %s\n", u_errorName(status));
    }
    if (udata_getMemory(dataItem) != NULL) {
        log_verbose("PASS: udata_getMemory(dataItem) in tree \"a\" passed\n");
    }
    else {
        log_err("FAIL: udata_getMemory returned NULL\n");
    }
    udata_close(dataItem);

    status = U_ZERO_ERROR;
    dataItem = udata_open("OffsetTOCAppData", "", "gOffsetTOCGarbage", &status);
    if (U_SUCCESS(status)) {
        log_err("FAIL: gOffsetTOCGarbage should not be opened. status = %s\n", u_errorName(status));
    }
    /* do not leak the handle if the open unexpectedly succeeded */
    udata_close(dataItem);

    status = U_ZERO_ERROR;
    dataItem = udata_open("OffsetTOCAppData", "", "gOffsetTOCNonExistent", &status);
    if (U_SUCCESS(status)) {
        log_err("FAIL: gOffsetTOCNonExistent should not be found. status = %s\n", u_errorName(status));
    }
    udata_close(dataItem);
}
/*
 * Negative tests for udata_setCommonData() and udata_setAppData().
 *
 * It's difficult to test that udata_setCommonData really works within the
 * test framework, so only the rejection paths are covered:
 *  - an incoming failure code must be left untouched,
 *  - a NULL data pointer must yield U_ILLEGAL_ARGUMENT_ERROR,
 *  - a buffer that does not contain ICU data must yield
 *    U_INVALID_FORMAT_ERROR.
 */
static void SetBadCommonData(void) {
    UErrorCode errorCode;
    /* same size as the real package image, but filled with plain text and zeros */
    char notData[sizeof(gOffsetTOCAppData_dat)];

    memset(notData, 0, sizeof(notData));
    strcpy(notData, "Hello! I'm not good data.");

    /* Case 1: a pre-set failure code means "do nothing" */
    errorCode = U_FILE_ACCESS_ERROR;
    udata_setCommonData(&gOffsetTOCAppData_dat, &errorCode);
    if (errorCode != U_FILE_ACCESS_ERROR) {
        log_err("FAIL: udata_setCommonData changed the failure code.\n");
    }

    /* Case 2: NULL data is an illegal argument */
    errorCode = U_ZERO_ERROR;
    udata_setCommonData(NULL, &errorCode);
    if (errorCode != U_ILLEGAL_ARGUMENT_ERROR) {
        log_err("FAIL: udata_setCommonData did not fail with bad arguments.\n");
    }

    /* Case 3: the data must be validated before it is accepted */
    errorCode = U_ZERO_ERROR;
    udata_setAppData("invalid path", notData, &errorCode);
    if (errorCode != U_INVALID_FORMAT_ERROR) {
        log_err("FAIL: udata_setAppData doesn't verify data validity.\n");
    }
}
// Check the override loading of time zone .res files from a specified path
//
// Hand testing notes:
//   1. Run this test with the environment variable set. The following should induce failures:
//        ICU_TIMEZONE_FILES_DIR=../testdata/out/build  LD_LIBRARY_PATH=../../lib:../../stubdata:../../tools/ctestfw:$LD_LIBRARY_PATH  ./cintltst /udatatst/TestTZDataDir
//   2. Build ICU with U_TIMEZONE_FILES_DIR defined. This should also induce failures.
//         CPPFLAGS=-DU_TIMEZONE_FILES_DIR\=`pwd`/test/testdata/out/testdata ./runConfigureICU Linux
//         make check
//
// The test reads the time zone data version three times: with the default
// data, after redirecting ICU to the test data directory (expected "2014a"),
// and again after resetting ICU. Every call's status is checked before the
// returned version string is compared.

static void TestTZDataDir(void) {
#if !UCONFIG_NO_FORMATTING
    UErrorCode status = U_ZERO_ERROR;
    const char *tzDataVersion;
    const char *testDataPath;

    // Verify that default ICU time zone data version is something newer than 2014a.
    tzDataVersion = ucal_getTZDataVersion(&status);
    // printf("tz data version is %s\n", tzDataVersion);
    if (U_FAILURE(status)) {
        log_data_err("Failed call to ucal_getTZDataVersion - %s\n", u_errorName(status));
        return;
    } else if (strcmp("2014a", tzDataVersion) == 0) {
        log_err("File %s:%d - expected something newer than time zone data 2014a.\n", __FILE__, __LINE__);
    }

    testDataPath = loadTestData(&status);
    if (U_FAILURE(status)) {
        // Nothing has been redirected yet, so there is nothing to restore.
        log_data_err("Could not load testdata.dat, status = %s\n", u_errorName(status));
        return;
    }

    // The path produced by loadTestData() will look something like
    //     whatever/.../testdata/out/testdata
    // The test data puts an old (2014a) version of the time zone data there.

    // Switch ICU to the testdata version of zoneinfo64.res, which is version 2014a.
    ctest_resetICU();
    u_setTimeZoneFilesDirectory(testDataPath, &status);
    tzDataVersion = ucal_getTZDataVersion(&status);
    if (U_FAILURE(status)) {
        // Fall through to the reset below so that ICU is restored in any case.
        log_data_err("File %s:%d - could not get the time zone data version from the test data - %s\n",
                     __FILE__, __LINE__, u_errorName(status));
    } else if (strcmp("2014a", tzDataVersion) != 0) {
        log_err("File %s:%d - expected \"2014a\"; actual \"%s\"\n", __FILE__, __LINE__, tzDataVersion);
    }

    ctest_resetICU();   // Return ICU to using its standard tz data.
    status = U_ZERO_ERROR;
    tzDataVersion = ucal_getTZDataVersion(&status);
    // printf("tz data version is %s\n", tzDataVersion);
    if (U_FAILURE(status)) {
        log_data_err("Failed call to ucal_getTZDataVersion - %s\n", u_errorName(status));
    } else if (strcmp("2014a", tzDataVersion) == 0) {
        log_err("File %s:%d - expected something newer than time zone data 2014a.\n", __FILE__, __LINE__);
    }
#endif
}