2003-05-15 18:28:41 +00:00
/********************************************************************
2009-03-09 20:39:13 +00:00
* Copyright ( c ) 1997 - 2009 International Business Machines
2008-09-18 23:07:16 +00:00
* Corporation and others . All Rights Reserved .
2003-05-15 18:28:41 +00:00
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
2008-01-05 01:27:56 +00:00
/*****************************************************************************
2003-05-15 18:28:41 +00:00
*
* File CAPITEST . C
*
* Modification History :
* Name Description
* Madhu Katragadda Ported for C API
2008-09-18 23:07:16 +00:00
* Brian Rower Added TestOpenVsOpenRules
2008-01-05 01:27:56 +00:00
* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * *
2003-05-15 18:28:41 +00:00
*/ /* C API TEST For COLLATOR */
# include "unicode/utypes.h"
# if !UCONFIG_NO_COLLATION
# include <stdio.h>
# include <stdlib.h>
# include <string.h>
# include "unicode/uloc.h"
2008-09-18 23:07:16 +00:00
# include "unicode/ulocdata.h"
2003-05-15 18:28:41 +00:00
# include "unicode/ustring.h"
# include "unicode/ures.h"
# include "unicode/ucoleitr.h"
# include "cintltst.h"
# include "capitst.h"
# include "ccolltst.h"
2004-10-18 02:43:33 +00:00
# include "putilimp.h"
2009-03-09 20:39:13 +00:00
# include "cstring.h"
2003-05-15 18:28:41 +00:00
static void TestAttribute ( void ) ;
2007-06-13 22:53:28 +00:00
static void TestDefault ( void ) ;
2008-11-17 20:27:25 +00:00
static void TestDefaultKeyword ( void ) ;
2004-11-11 23:34:58 +00:00
int TestBufferSize ( ) ; /* defined in "colutil.c" */
2003-05-15 18:28:41 +00:00
2003-09-13 00:07:12 +00:00
2003-05-15 18:28:41 +00:00
/* next two function is modified from "i18n/ucol.cpp" to avoid include "ucol_imp.h" */
static void uprv_appendByteToHexString ( char * dst , uint8_t val ) {
uint32_t len = ( uint32_t ) strlen ( dst ) ;
sprintf ( dst + len , " %02X " , val ) ;
}
static char * U_EXPORT2 ucol_sortKeyToString ( const UCollator * coll , const uint8_t * sortkey , char * buffer , uint32_t * len ) {
int32_t strength = UCOL_PRIMARY ;
uint32_t res_size = 0 ;
UBool doneCase = FALSE ;
char * current = buffer ;
const uint8_t * currentSk = sortkey ;
2003-06-04 21:11:41 +00:00
UErrorCode error_code = U_ZERO_ERROR ;
2003-05-15 18:28:41 +00:00
strcpy ( current , " [ " ) ;
while ( strength < = UCOL_QUATERNARY & & strength < = ucol_getAttribute ( coll , UCOL_STRENGTH , & error_code ) ) {
2003-06-04 21:11:41 +00:00
if ( U_FAILURE ( error_code ) ) {
log_err ( " ucol_getAttribute returned error: %s \n " , u_errorName ( error_code ) ) ;
}
2003-05-15 18:28:41 +00:00
if ( strength > UCOL_PRIMARY ) {
strcat ( current , " . " ) ;
2001-11-13 22:55:05 +00:00
}
2003-05-15 18:28:41 +00:00
while ( * currentSk ! = 0x01 & & * currentSk ! = 0x00 ) { /* print a level */
uprv_appendByteToHexString ( current , * currentSk + + ) ;
strcat ( current , " " ) ;
2001-11-13 22:55:05 +00:00
}
2003-05-15 18:28:41 +00:00
if ( ucol_getAttribute ( coll , UCOL_CASE_LEVEL , & error_code ) = = UCOL_ON & & strength = = UCOL_SECONDARY & & doneCase = = FALSE ) {
doneCase = TRUE ;
} else if ( ucol_getAttribute ( coll , UCOL_CASE_LEVEL , & error_code ) = = UCOL_OFF | | doneCase = = TRUE | | strength ! = UCOL_SECONDARY ) {
strength + + ;
2001-11-13 22:55:05 +00:00
}
2003-06-04 21:11:41 +00:00
if ( U_FAILURE ( error_code ) ) {
log_err ( " ucol_getAttribute returned error: %s \n " , u_errorName ( error_code ) ) ;
}
2003-05-15 18:28:41 +00:00
uprv_appendByteToHexString ( current , * currentSk + + ) ; /* This should print '01' */
if ( strength = = UCOL_QUATERNARY & & ucol_getAttribute ( coll , UCOL_ALTERNATE_HANDLING , & error_code ) = = UCOL_NON_IGNORABLE ) {
break ;
}
}
if ( ucol_getAttribute ( coll , UCOL_STRENGTH , & error_code ) = = UCOL_IDENTICAL ) {
strcat ( current , " . " ) ;
while ( * currentSk ! = 0 ) {
uprv_appendByteToHexString ( current , * currentSk + + ) ;
strcat ( current , " " ) ;
}
uprv_appendByteToHexString ( current , * currentSk + + ) ;
}
2003-06-04 21:11:41 +00:00
if ( U_FAILURE ( error_code ) ) {
log_err ( " ucol_getAttribute returned error: %s \n " , u_errorName ( error_code ) ) ;
}
2003-05-15 18:28:41 +00:00
strcat ( current , " ] " ) ;
if ( res_size > * len ) {
return NULL ;
}
return buffer ;
}
/* end of avoid include "ucol_imp.h" */
void addCollAPITest ( TestNode * * root )
{
/* WEIVTODO: return tests here */
addTest ( root , & TestProperty , " tscoll/capitst/TestProperty " ) ;
addTest ( root , & TestRuleBasedColl , " tscoll/capitst/TestRuleBasedColl " ) ;
addTest ( root , & TestCompare , " tscoll/capitst/TestCompare " ) ;
addTest ( root , & TestSortKey , " tscoll/capitst/TestSortKey " ) ;
addTest ( root , & TestHashCode , " tscoll/capitst/TestHashCode " ) ;
addTest ( root , & TestElemIter , " tscoll/capitst/TestElemIter " ) ;
addTest ( root , & TestGetAll , " tscoll/capitst/TestGetAll " ) ;
/*addTest(root, &TestGetDefaultRules, "tscoll/capitst/TestGetDefaultRules");*/
addTest ( root , & TestDecomposition , " tscoll/capitst/TestDecomposition " ) ;
addTest ( root , & TestSafeClone , " tscoll/capitst/TestSafeClone " ) ;
2005-06-30 22:45:24 +00:00
addTest ( root , & TestCloneBinary , " tscoll/capitst/TestCloneBinary " ) ;
2003-05-15 18:28:41 +00:00
addTest ( root , & TestGetSetAttr , " tscoll/capitst/TestGetSetAttr " ) ;
addTest ( root , & TestBounds , " tscoll/capitst/TestBounds " ) ;
2007-03-09 07:14:25 +00:00
addTest ( root , & TestGetLocale , " tscoll/capitst/TestGetLocale " ) ;
2003-05-15 18:28:41 +00:00
addTest ( root , & TestSortKeyBufferOverrun , " tscoll/capitst/TestSortKeyBufferOverrun " ) ;
addTest ( root , & TestAttribute , " tscoll/capitst/TestAttribute " ) ;
addTest ( root , & TestGetTailoredSet , " tscoll/capitst/TestGetTailoredSet " ) ;
addTest ( root , & TestMergeSortKeys , " tscoll/capitst/TestMergeSortKeys " ) ;
2004-05-24 22:08:38 +00:00
addTest ( root , & TestShortString , " tscoll/capitst/TestShortString " ) ;
2004-06-03 20:13:58 +00:00
addTest ( root , & TestGetContractionsAndUnsafes , " tscoll/capitst/TestGetContractionsAndUnsafes " ) ;
2005-07-06 21:27:21 +00:00
addTest ( root , & TestOpenBinary , " tscoll/capitst/TestOpenBinary " ) ;
2007-06-13 22:53:28 +00:00
addTest ( root , & TestDefault , " tscoll/capitst/TestDefault " ) ;
2008-11-17 20:27:25 +00:00
addTest ( root , & TestDefaultKeyword , " tscoll/capitst/TestDefaultKeyword " ) ;
2008-09-18 23:07:16 +00:00
addTest ( root , & TestOpenVsOpenRules , " tscoll/capitst/TestOpenVsOpenRules " ) ;
2009-03-09 20:39:13 +00:00
addTest ( root , & TestGetKeywordValuesForLocale , " tscoll/capitst/TestGetKeywordValuesForLocale " ) ;
2003-05-15 18:28:41 +00:00
}
void TestGetSetAttr ( void ) {
UErrorCode status = U_ZERO_ERROR ;
UCollator * coll = ucol_open ( NULL , & status ) ;
struct attrTest {
UColAttribute att ;
UColAttributeValue val [ 5 ] ;
uint32_t valueSize ;
UColAttributeValue nonValue ;
} attrs [ ] = {
{ UCOL_FRENCH_COLLATION , { UCOL_ON , UCOL_OFF } , 2 , UCOL_SHIFTED } ,
{ UCOL_ALTERNATE_HANDLING , { UCOL_NON_IGNORABLE , UCOL_SHIFTED } , 2 , UCOL_OFF } , /* attribute for handling variable elements*/
{ UCOL_CASE_FIRST , { UCOL_OFF , UCOL_LOWER_FIRST , UCOL_UPPER_FIRST } , 3 , UCOL_SHIFTED } , /* who goes first, lower case or uppercase */
{ UCOL_CASE_LEVEL , { UCOL_ON , UCOL_OFF } , 2 , UCOL_SHIFTED } , /* do we have an extra case level */
{ UCOL_NORMALIZATION_MODE , { UCOL_ON , UCOL_OFF } , 2 , UCOL_SHIFTED } , /* attribute for normalization */
{ UCOL_DECOMPOSITION_MODE , { UCOL_ON , UCOL_OFF } , 2 , UCOL_SHIFTED } ,
{ UCOL_STRENGTH , { UCOL_PRIMARY , UCOL_SECONDARY , UCOL_TERTIARY , UCOL_QUATERNARY , UCOL_IDENTICAL } , 5 , UCOL_SHIFTED } , /* attribute for strength */
{ UCOL_HIRAGANA_QUATERNARY_MODE , { UCOL_ON , UCOL_OFF } , 2 , UCOL_SHIFTED } , /* when turned on, this attribute */
} ;
UColAttribute currAttr ;
UColAttributeValue value ;
uint32_t i = 0 , j = 0 ;
for ( i = 0 ; i < sizeof ( attrs ) / sizeof ( attrs [ 0 ] ) ; i + + ) {
currAttr = attrs [ i ] . att ;
ucol_setAttribute ( coll , currAttr , UCOL_DEFAULT , & status ) ;
if ( U_FAILURE ( status ) ) {
log_err ( " ucol_setAttribute with the default value returned error: %s \n " , u_errorName ( status ) ) ;
break ;
}
value = ucol_getAttribute ( coll , currAttr , & status ) ;
if ( U_FAILURE ( status ) ) {
log_err ( " ucol_getAttribute returned error: %s \n " , u_errorName ( status ) ) ;
break ;
}
for ( j = 0 ; j < attrs [ i ] . valueSize ; j + + ) {
ucol_setAttribute ( coll , currAttr , attrs [ i ] . val [ j ] , & status ) ;
if ( U_FAILURE ( status ) ) {
log_err ( " ucol_setAttribute with the value %i returned error: %s \n " , attrs [ i ] . val [ j ] , u_errorName ( status ) ) ;
break ;
2003-05-15 16:28:58 +00:00
}
2001-11-13 22:55:05 +00:00
}
2003-05-15 18:28:41 +00:00
status = U_ZERO_ERROR ;
ucol_setAttribute ( coll , currAttr , attrs [ i ] . nonValue , & status ) ;
if ( U_SUCCESS ( status ) ) {
log_err ( " ucol_setAttribute with the bad value didn't return an error \n " ) ;
break ;
1999-08-16 21:50:52 +00:00
}
2003-05-15 18:28:41 +00:00
status = U_ZERO_ERROR ;
ucol_setAttribute ( coll , currAttr , value , & status ) ;
if ( U_FAILURE ( status ) ) {
log_err ( " ucol_setAttribute with the default valuereturned error: %s \n " , u_errorName ( status ) ) ;
break ;
2000-08-09 22:49:33 +00:00
}
2003-05-15 18:28:41 +00:00
}
status = U_ZERO_ERROR ;
value = ucol_getAttribute ( coll , UCOL_ATTRIBUTE_COUNT , & status ) ;
if ( U_SUCCESS ( status ) ) {
log_err ( " ucol_getAttribute for UCOL_ATTRIBUTE_COUNT didn't return an error \n " ) ;
}
status = U_ZERO_ERROR ;
ucol_setAttribute ( coll , UCOL_ATTRIBUTE_COUNT , UCOL_DEFAULT , & status ) ;
if ( U_SUCCESS ( status ) ) {
log_err ( " ucol_setAttribute for UCOL_ATTRIBUTE_COUNT didn't return an error \n " ) ;
}
status = U_ZERO_ERROR ;
ucol_close ( coll ) ;
}
static void doAssert ( int condition , const char * message )
{
if ( condition = = 0 ) {
log_err ( " ERROR : %s \n " , message ) ;
}
}
#if 0
/* We don't have default rules, at least not in the previous sense */
void TestGetDefaultRules ( ) {
uint32_t size = 0 ;
UErrorCode status = U_ZERO_ERROR ;
UCollator * coll = NULL ;
int32_t len1 = 0 , len2 = 0 ;
uint8_t * binColData = NULL ;
UResourceBundle * res = NULL ;
UResourceBundle * binColl = NULL ;
uint8_t * binResult = NULL ;
const UChar * defaultRulesArray = ucol_getDefaultRulesArray ( & size ) ;
log_verbose ( " Test the function ucol_getDefaultRulesArray() \n " ) ;
coll = ucol_openRules ( defaultRulesArray , size , UCOL_ON , UCOL_PRIMARY , & status ) ;
if ( U_SUCCESS ( status ) & & coll ! = NULL ) {
binColData = ( uint8_t * ) ucol_cloneRuleData ( coll , & len1 , & status ) ;
2003-05-15 16:28:58 +00:00
2003-05-15 18:28:41 +00:00
}
status = U_ZERO_ERROR ;
res = ures_open ( NULL , " root " , & status ) ;
if ( U_FAILURE ( status ) ) {
log_err ( " ERROR: Failed to get resource for \" root Locale \" with %s " , myErrorName ( status ) ) ;
return ;
}
binColl = ures_getByKey ( res , " %%Collation " , binColl , & status ) ;
if ( U_SUCCESS ( status ) ) {
binResult = ( uint8_t * ) ures_getBinary ( binColl , & len2 , & status ) ;
2003-05-15 16:28:58 +00:00
if ( U_FAILURE ( status ) ) {
2003-05-15 18:28:41 +00:00
log_err ( " ERROR: ures_getBinary() failed \n " ) ;
2003-05-15 16:28:58 +00:00
}
2003-05-15 18:28:41 +00:00
} else {
log_err ( " ERROR: ures_getByKey(locale(default), %%Collation) failed " ) ;
}
if ( len1 ! = len2 ) {
log_err ( " Error: ucol_getDefaultRulesArray() failed to return the correct length. \n " ) ;
}
if ( memcmp ( binColData , binResult , len1 ) ! = 0 ) {
log_err ( " Error: ucol_getDefaultRulesArray() failed \n " ) ;
}
free ( binColData ) ;
ures_close ( binColl ) ;
ures_close ( res ) ;
ucol_close ( coll ) ;
}
# endif
/* Collator Properties
ucol_open , ucol_strcoll , getStrength / setStrength
getDecomposition / setDecomposition , getDisplayName */
void TestProperty ( )
{
UCollator * col , * ruled ;
UChar * disName ;
int32_t len = 0 , i = 0 ;
UChar * source , * target ;
int32_t tempLength ;
UErrorCode status = U_ZERO_ERROR ;
/*
All the collations have the same version in an ICU
version .
ICU 2.0 currVersionArray = { 0x18 , 0xC0 , 0x02 , 0x02 } ;
ICU 2.1 currVersionArray = { 0x19 , 0x00 , 0x03 , 0x03 } ;
ICU 2.2 currVersionArray = { 0x21 , 0x40 , 0x04 , 0x04 } ;
ICU 2.4 currVersionArray = { 0x21 , 0x40 , 0x04 , 0x04 } ;
2003-08-23 01:46:02 +00:00
ICU 2.6 currVersionArray = { 0x21 , 0x40 , 0x03 , 0x03 } ;
2005-06-24 23:09:31 +00:00
ICU 2.8 currVersionArray = { 0x29 , 0x80 , 0x00 , 0x04 } ;
2006-06-16 05:47:24 +00:00
ICU 3.4 currVersionArray = { 0x31 , 0xC0 , 0x00 , 0x04 } ;
2003-05-15 18:28:41 +00:00
*/
2008-08-08 15:04:18 +00:00
UVersionInfo currVersionArray = { 0x31 , 0xC0 , 0x00 , 0x29 } ;
2006-06-16 05:47:24 +00:00
/* ICU 3.4 had UCA 4.1 */
/*UVersionInfo currUCAVersionArray = {4, 1, 0, 0};*/
2008-04-04 22:47:43 +00:00
UVersionInfo currUCAVersionArray = { 5 , 1 , 0 , 0 } ;
2004-01-14 21:50:51 +00:00
UVersionInfo versionArray = { 0 , 0 , 0 , 0 } ;
UVersionInfo versionUCAArray = { 0 , 0 , 0 , 0 } ;
2003-05-15 18:28:41 +00:00
log_verbose ( " The property tests begin : \n " ) ;
log_verbose ( " Test ucol_strcoll : \n " ) ;
col = ucol_open ( " en_US " , & status ) ;
if ( U_FAILURE ( status ) ) {
log_err ( " Default Collator creation failed.: %s \n " , myErrorName ( status ) ) ;
return ;
}
ucol_getVersion ( col , versionArray ) ;
for ( i = 0 ; i < 4 ; + + i ) {
if ( versionArray [ i ] ! = currVersionArray [ i ] ) {
log_err ( " Testing ucol_getVersion() - unexpected result: %hu.%hu.%hu.%hu \n " ,
versionArray [ 0 ] , versionArray [ 1 ] , versionArray [ 2 ] , versionArray [ 3 ] ) ;
break ;
}
}
2004-01-14 21:50:51 +00:00
ucol_getUCAVersion ( col , versionUCAArray ) ;
2004-01-08 22:53:45 +00:00
for ( i = 0 ; i < 4 ; + + i ) {
2004-01-14 21:50:51 +00:00
if ( versionUCAArray [ i ] ! = currUCAVersionArray [ i ] ) {
log_err ( " Testing ucol_getUCAVersion() - unexpected result: %hu.%hu.%hu.%hu \n " ,
versionUCAArray [ 0 ] , versionUCAArray [ 1 ] , versionUCAArray [ 2 ] , versionUCAArray [ 3 ] ) ;
2004-01-08 22:53:45 +00:00
break ;
}
}
2003-05-15 18:28:41 +00:00
source = ( UChar * ) malloc ( sizeof ( UChar ) * 12 ) ;
target = ( UChar * ) malloc ( sizeof ( UChar ) * 12 ) ;
u_uastrcpy ( source , " ab " ) ;
u_uastrcpy ( target , " abc " ) ;
doAssert ( ( ucol_strcoll ( col , source , u_strlen ( source ) , target , u_strlen ( target ) ) = = UCOL_LESS ) , " ab < abc comparison failed " ) ;
u_uastrcpy ( source , " ab " ) ;
u_uastrcpy ( target , " AB " ) ;
doAssert ( ( ucol_strcoll ( col , source , u_strlen ( source ) , target , u_strlen ( target ) ) = = UCOL_LESS ) , " ab < AB comparison failed " ) ;
/* u_uastrcpy(source, "black-bird");
u_uastrcpy ( target , " blackbird " ) ; */
u_uastrcpy ( target , " black-bird " ) ;
u_uastrcpy ( source , " blackbird " ) ;
doAssert ( ( ucol_strcoll ( col , source , u_strlen ( source ) , target , u_strlen ( target ) ) = = UCOL_GREATER ) ,
" black-bird > blackbird comparison failed " ) ;
u_uastrcpy ( source , " black bird " ) ;
u_uastrcpy ( target , " black-bird " ) ;
doAssert ( ( ucol_strcoll ( col , source , u_strlen ( source ) , target , u_strlen ( target ) ) = = UCOL_LESS ) ,
" black bird < black-bird comparison failed " ) ;
u_uastrcpy ( source , " Hello " ) ;
u_uastrcpy ( target , " hello " ) ;
doAssert ( ( ucol_strcoll ( col , source , u_strlen ( source ) , target , u_strlen ( target ) ) = = UCOL_GREATER ) ,
" Hello > hello comparison failed " ) ;
free ( source ) ;
free ( target ) ;
log_verbose ( " Test ucol_strcoll ends. \n " ) ;
log_verbose ( " testing ucol_getStrength() method ... \n " ) ;
doAssert ( ( ucol_getStrength ( col ) = = UCOL_TERTIARY ) , " collation object has the wrong strength " ) ;
doAssert ( ( ucol_getStrength ( col ) ! = UCOL_PRIMARY ) , " collation object's strength is primary difference " ) ;
2003-05-15 16:28:58 +00:00
2003-05-15 18:28:41 +00:00
log_verbose ( " testing ucol_setStrength() method ... \n " ) ;
ucol_setStrength ( col , UCOL_SECONDARY ) ;
doAssert ( ( ucol_getStrength ( col ) ! = UCOL_TERTIARY ) , " collation object's strength is secondary difference " ) ;
doAssert ( ( ucol_getStrength ( col ) ! = UCOL_PRIMARY ) , " collation object's strength is primary difference " ) ;
doAssert ( ( ucol_getStrength ( col ) = = UCOL_SECONDARY ) , " collation object has the wrong strength " ) ;
log_verbose ( " Get display name for the default collation in German : \n " ) ;
len = ucol_getDisplayName ( " en_US " , " de_DE " , NULL , 0 , & status ) ;
if ( status = = U_BUFFER_OVERFLOW_ERROR ) {
status = U_ZERO_ERROR ;
disName = ( UChar * ) malloc ( sizeof ( UChar ) * ( len + 1 ) ) ;
ucol_getDisplayName ( " en_US " , " de_DE " , disName , len + 1 , & status ) ;
log_verbose ( " the display name for default collation in german: %s \n " , austrdup ( disName ) ) ;
free ( disName ) ;
1999-08-16 21:50:52 +00:00
}
2003-05-15 18:28:41 +00:00
if ( U_FAILURE ( status ) ) {
log_err ( " ERROR: in getDisplayName: %s \n " , myErrorName ( status ) ) ;
return ;
}
log_verbose ( " Default collation getDisplayName ended. \n " ) ;
ruled = ucol_open ( " da_DK " , & status ) ;
log_verbose ( " ucol_getRules() testing ... \n " ) ;
ucol_getRules ( ruled , & tempLength ) ;
doAssert ( tempLength ! = 0 , " getRules() result incorrect " ) ;
log_verbose ( " getRules tests end. \n " ) ;
2003-05-15 16:28:58 +00:00
{
2003-05-15 18:28:41 +00:00
UChar * buffer = ( UChar * ) malloc ( 200000 * sizeof ( UChar ) ) ;
int32_t bufLen = 200000 ;
buffer [ 0 ] = ' \0 ' ;
log_verbose ( " ucol_getRulesEx() testing ... \n " ) ;
tempLength = ucol_getRulesEx ( col , UCOL_TAILORING_ONLY , buffer , bufLen ) ;
2004-10-13 00:44:55 +00:00
doAssert ( tempLength = = 0x0a , " getRulesEx() result incorrect " ) ;
2003-05-15 18:28:41 +00:00
log_verbose ( " getRules tests end. \n " ) ;
2003-05-15 16:28:58 +00:00
2003-05-15 18:28:41 +00:00
log_verbose ( " ucol_getRulesEx() testing ... \n " ) ;
tempLength = ucol_getRulesEx ( col , UCOL_FULL_RULES , buffer , bufLen ) ;
doAssert ( tempLength ! = 0 , " getRulesEx() result incorrect " ) ;
log_verbose ( " getRules tests end. \n " ) ;
free ( buffer ) ;
}
ucol_close ( ruled ) ;
ucol_close ( col ) ;
log_verbose ( " open an collator for french locale " ) ;
col = ucol_open ( " fr_FR " , & status ) ;
if ( U_FAILURE ( status ) ) {
log_err ( " ERROR: Creating French collation failed.: %s \n " , myErrorName ( status ) ) ;
return ;
}
ucol_setStrength ( col , UCOL_PRIMARY ) ;
log_verbose ( " testing ucol_getStrength() method again ... \n " ) ;
doAssert ( ( ucol_getStrength ( col ) ! = UCOL_TERTIARY ) , " collation object has the wrong strength " ) ;
doAssert ( ( ucol_getStrength ( col ) = = UCOL_PRIMARY ) , " collation object's strength is not primary difference " ) ;
2003-05-15 16:28:58 +00:00
2003-05-15 18:28:41 +00:00
log_verbose ( " testing French ucol_setStrength() method ... \n " ) ;
ucol_setStrength ( col , UCOL_TERTIARY ) ;
doAssert ( ( ucol_getStrength ( col ) = = UCOL_TERTIARY ) , " collation object's strength is not tertiary difference " ) ;
doAssert ( ( ucol_getStrength ( col ) ! = UCOL_PRIMARY ) , " collation object's strength is primary difference " ) ;
doAssert ( ( ucol_getStrength ( col ) ! = UCOL_SECONDARY ) , " collation object's strength is secondary difference " ) ;
ucol_close ( col ) ;
log_verbose ( " Get display name for the french collation in english : \n " ) ;
len = ucol_getDisplayName ( " fr_FR " , " en_US " , NULL , 0 , & status ) ;
if ( status = = U_BUFFER_OVERFLOW_ERROR ) {
status = U_ZERO_ERROR ;
disName = ( UChar * ) malloc ( sizeof ( UChar ) * ( len + 1 ) ) ;
ucol_getDisplayName ( " fr_FR " , " en_US " , disName , len + 1 , & status ) ;
log_verbose ( " the display name for french collation in english: %s \n " , austrdup ( disName ) ) ;
free ( disName ) ;
}
if ( U_FAILURE ( status ) ) {
log_err ( " ERROR: in getDisplayName: %s \n " , myErrorName ( status ) ) ;
return ;
}
log_verbose ( " Default collation getDisplayName ended. \n " ) ;
}
/* Test RuleBasedCollator and getRules*/
void TestRuleBasedColl ( )
{
UCollator * col1 , * col2 , * col3 , * col4 ;
UCollationElements * iter1 , * iter2 ;
UChar ruleset1 [ 60 ] ;
UChar ruleset2 [ 50 ] ;
UChar teststr [ 10 ] ;
UChar teststr2 [ 10 ] ;
const UChar * rule1 , * rule2 , * rule3 , * rule4 ;
int32_t tempLength ;
UErrorCode status = U_ZERO_ERROR ;
u_uastrcpy ( ruleset1 , " &9 < a, A < b, B < c, C; ch, cH, Ch, CH < d, D, e, E " ) ;
u_uastrcpy ( ruleset2 , " &9 < a, A < b, B < c, C < d, D, e, E " ) ;
2003-09-13 00:07:12 +00:00
2003-05-15 18:28:41 +00:00
col1 = ucol_openRules ( ruleset1 , u_strlen ( ruleset1 ) , UCOL_DEFAULT , UCOL_DEFAULT_STRENGTH , NULL , & status ) ;
if ( U_FAILURE ( status ) ) {
log_err ( " RuleBased Collator creation failed.: %s \n " , myErrorName ( status ) ) ;
return ;
}
else
log_verbose ( " PASS: RuleBased Collator creation passed \n " ) ;
status = U_ZERO_ERROR ;
col2 = ucol_openRules ( ruleset2 , u_strlen ( ruleset2 ) , UCOL_DEFAULT , UCOL_DEFAULT_STRENGTH , NULL , & status ) ;
if ( U_FAILURE ( status ) ) {
log_err ( " RuleBased Collator creation failed.: %s \n " , myErrorName ( status ) ) ;
return ;
}
else
log_verbose ( " PASS: RuleBased Collator creation passed \n " ) ;
2003-05-15 16:28:58 +00:00
1999-08-16 21:50:52 +00:00
2003-05-15 18:28:41 +00:00
status = U_ZERO_ERROR ;
col3 = ucol_open ( NULL , & status ) ;
if ( U_FAILURE ( status ) ) {
log_err ( " Default Collator creation failed.: %s \n " , myErrorName ( status ) ) ;
return ;
}
else
log_verbose ( " PASS: Default Collator creation passed \n " ) ;
rule1 = ucol_getRules ( col1 , & tempLength ) ;
rule2 = ucol_getRules ( col2 , & tempLength ) ;
rule3 = ucol_getRules ( col3 , & tempLength ) ;
doAssert ( ( u_strcmp ( rule1 , rule2 ) ! = 0 ) , " Default collator getRules failed " ) ;
doAssert ( ( u_strcmp ( rule2 , rule3 ) ! = 0 ) , " Default collator getRules failed " ) ;
doAssert ( ( u_strcmp ( rule1 , rule3 ) ! = 0 ) , " Default collator getRules failed " ) ;
col4 = ucol_openRules ( rule2 , u_strlen ( rule2 ) , UCOL_DEFAULT , UCOL_DEFAULT_STRENGTH , NULL , & status ) ;
if ( U_FAILURE ( status ) ) {
log_err ( " RuleBased Collator creation failed.: %s \n " , myErrorName ( status ) ) ;
return ;
}
rule4 = ucol_getRules ( col4 , & tempLength ) ;
doAssert ( ( u_strcmp ( rule2 , rule4 ) = = 0 ) , " Default collator getRules failed " ) ;
ucol_close ( col1 ) ;
ucol_close ( col2 ) ;
ucol_close ( col3 ) ;
ucol_close ( col4 ) ;
/* tests that modifier ! is always ignored */
u_uastrcpy ( ruleset1 , " !&a<b " ) ;
teststr [ 0 ] = 0x0e40 ;
teststr [ 1 ] = 0x0e01 ;
teststr [ 2 ] = 0x0e2d ;
col1 = ucol_openRules ( ruleset1 , u_strlen ( ruleset1 ) , UCOL_DEFAULT , UCOL_DEFAULT_STRENGTH , NULL , & status ) ;
if ( U_FAILURE ( status ) ) {
log_err ( " RuleBased Collator creation failed.: %s \n " , myErrorName ( status ) ) ;
return ;
}
col2 = ucol_open ( " en_US " , & status ) ;
if ( U_FAILURE ( status ) ) {
log_err ( " en_US Collator creation failed.: %s \n " , myErrorName ( status ) ) ;
return ;
}
iter1 = ucol_openElements ( col1 , teststr , 3 , & status ) ;
iter2 = ucol_openElements ( col2 , teststr , 3 , & status ) ;
if ( U_FAILURE ( status ) ) {
log_err ( " ERROR: CollationElement iterator creation failed.: %s \n " , myErrorName ( status ) ) ;
return ;
}
while ( TRUE ) {
/* testing with en since thai has its own tailoring */
uint32_t ce = ucol_next ( iter1 , & status ) ;
uint32_t ce2 = ucol_next ( iter2 , & status ) ;
2004-11-11 23:34:58 +00:00
if ( U_FAILURE ( status ) ) {
2002-07-12 20:33:01 +00:00
log_err ( " ERROR: CollationElement iterator creation failed.: %s \n " , myErrorName ( status ) ) ;
return ;
2004-11-11 23:34:58 +00:00
}
2003-05-15 18:28:41 +00:00
if ( ce2 ! = ce ) {
log_err ( " ! modifier test failed " ) ;
2002-07-12 20:33:01 +00:00
}
2003-05-15 18:28:41 +00:00
if ( ce = = UCOL_NULLORDER ) {
break ;
2003-05-15 16:28:58 +00:00
}
2002-07-12 20:33:01 +00:00
}
2003-05-15 18:28:41 +00:00
ucol_closeElements ( iter1 ) ;
ucol_closeElements ( iter2 ) ;
ucol_close ( col1 ) ;
ucol_close ( col2 ) ;
/* test that we can start a rule without a & or < */
u_uastrcpy ( ruleset1 , " < z < a " ) ;
col1 = ucol_openRules ( ruleset1 , u_strlen ( ruleset1 ) , UCOL_DEFAULT , UCOL_DEFAULT_STRENGTH , NULL , & status ) ;
if ( U_FAILURE ( status ) ) {
log_err ( " RuleBased Collator creation failed.: %s \n " , myErrorName ( status ) ) ;
return ;
}
u_uastrcpy ( teststr , " z " ) ;
u_uastrcpy ( teststr2 , " a " ) ;
if ( ucol_greaterOrEqual ( col1 , teststr , 1 , teststr2 , 1 ) ) {
log_err ( " Rule \" z < a \" fails " ) ;
}
ucol_close ( col1 ) ;
}
void TestCompare ( )
{
UErrorCode status = U_ZERO_ERROR ;
UCollator * col ;
UChar * test1 ;
UChar * test2 ;
log_verbose ( " The compare tests begin : \n " ) ;
status = U_ZERO_ERROR ;
col = ucol_open ( " en_US " , & status ) ;
if ( U_FAILURE ( status ) ) {
log_err ( " ucal_open() collation creation failed.: %s \n " , myErrorName ( status ) ) ;
return ;
}
test1 = ( UChar * ) malloc ( sizeof ( UChar ) * 6 ) ;
test2 = ( UChar * ) malloc ( sizeof ( UChar ) * 6 ) ;
u_uastrcpy ( test1 , " Abcda " ) ;
u_uastrcpy ( test2 , " abcda " ) ;
log_verbose ( " Use tertiary comparison level testing .... \n " ) ;
doAssert ( ( ! ucol_equal ( col , test1 , u_strlen ( test1 ) , test2 , u_strlen ( test2 ) ) ) , " Result should be \" Abcda \" != \" abcda \" " ) ;
doAssert ( ( ucol_greater ( col , test1 , u_strlen ( test1 ) , test2 , u_strlen ( test2 ) ) ) , " Result should be \" Abcda \" >>> \" abcda \" " ) ;
doAssert ( ( ucol_greaterOrEqual ( col , test1 , u_strlen ( test1 ) , test2 , u_strlen ( test2 ) ) ) , " Result should be \" Abcda \" >>> \" abcda \" " ) ;
ucol_setStrength ( col , UCOL_SECONDARY ) ;
log_verbose ( " Use secondary comparison level testing .... \n " ) ;
doAssert ( ( ucol_equal ( col , test1 , u_strlen ( test1 ) , test2 , u_strlen ( test2 ) ) ) , " Result should be \" Abcda \" == \" abcda \" " ) ;
doAssert ( ( ! ucol_greater ( col , test1 , u_strlen ( test1 ) , test2 , u_strlen ( test2 ) ) ) , " Result should be \" Abcda \" == \" abcda \" " ) ;
doAssert ( ( ucol_greaterOrEqual ( col , test1 , u_strlen ( test1 ) , test2 , u_strlen ( test2 ) ) ) , " Result should be \" Abcda \" == \" abcda \" " ) ;
ucol_setStrength ( col , UCOL_PRIMARY ) ;
log_verbose ( " Use primary comparison level testing .... \n " ) ;
doAssert ( ( ucol_equal ( col , test1 , u_strlen ( test1 ) , test2 , u_strlen ( test2 ) ) ) , " Result should be \" Abcda \" == \" abcda \" " ) ;
doAssert ( ( ! ucol_greater ( col , test1 , u_strlen ( test1 ) , test2 , u_strlen ( test2 ) ) ) , " Result should be \" Abcda \" == \" abcda \" " ) ;
doAssert ( ( ucol_greaterOrEqual ( col , test1 , u_strlen ( test1 ) , test2 , u_strlen ( test2 ) ) ) , " Result should be \" Abcda \" == \" abcda \" " ) ;
log_verbose ( " The compare tests end. \n " ) ;
ucol_close ( col ) ;
free ( test1 ) ;
free ( test2 ) ;
}
/*
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
tests decomposition setting
*/
void TestDecomposition ( ) {
UErrorCode status = U_ZERO_ERROR ;
UCollator * en_US , * el_GR , * vi_VN ;
en_US = ucol_open ( " en_US " , & status ) ;
el_GR = ucol_open ( " el_GR " , & status ) ;
vi_VN = ucol_open ( " vi_VN " , & status ) ;
if ( U_FAILURE ( status ) ) {
log_err ( " ERROR: collation creation failed.: %s \n " , myErrorName ( status ) ) ;
return ;
}
if ( ucol_getAttribute ( vi_VN , UCOL_NORMALIZATION_MODE , & status ) ! = UCOL_ON | |
U_FAILURE ( status ) )
2001-05-31 23:30:09 +00:00
{
2003-05-15 18:28:41 +00:00
log_err ( " ERROR: vi_VN collation did not have cannonical decomposition for normalization! \n " ) ;
2001-11-15 17:46:51 +00:00
}
2003-05-15 18:28:41 +00:00
status = U_ZERO_ERROR ;
if ( ucol_getAttribute ( el_GR , UCOL_NORMALIZATION_MODE , & status ) ! = UCOL_ON | |
U_FAILURE ( status ) )
{
log_err ( " ERROR: el_GR collation did not have cannonical decomposition for normalization! \n " ) ;
1999-08-16 21:50:52 +00:00
}
2003-05-15 18:28:41 +00:00
status = U_ZERO_ERROR ;
if ( ucol_getAttribute ( en_US , UCOL_NORMALIZATION_MODE , & status ) ! = UCOL_OFF | |
U_FAILURE ( status ) )
{
log_err ( " ERROR: en_US collation had cannonical decomposition for normalization! \n " ) ;
}
ucol_close ( en_US ) ;
ucol_close ( el_GR ) ;
ucol_close ( vi_VN ) ;
}
2006-05-21 17:56:44 +00:00
# define CLONETEST_COLLATOR_COUNT 4
2003-05-15 18:28:41 +00:00
void TestSafeClone ( ) {
2008-02-08 09:50:36 +00:00
UChar test1 [ 6 ] ;
UChar test2 [ 6 ] ;
2006-06-05 21:56:14 +00:00
static const UChar umlautUStr [ ] = { 0x00DC , 0 } ;
static const UChar oeStr [ ] = { 0x0055 , 0x0045 , 0 } ;
2003-05-15 18:28:41 +00:00
UCollator * someCollators [ CLONETEST_COLLATOR_COUNT ] ;
UCollator * someClonedCollators [ CLONETEST_COLLATOR_COUNT ] ;
UCollator * col ;
UErrorCode err = U_ZERO_ERROR ;
2008-02-08 09:50:36 +00:00
int8_t index = 6 ; /* Leave this here to test buffer alingment in memory*/
2003-05-15 18:28:41 +00:00
uint8_t buffer [ CLONETEST_COLLATOR_COUNT ] [ U_COL_SAFECLONE_BUFFERSIZE ] ;
int32_t bufferSize = U_COL_SAFECLONE_BUFFERSIZE ;
2006-05-21 17:56:44 +00:00
const char sampleRuleChars [ ] = " &Z < CH " ;
UChar sampleRule [ sizeof ( sampleRuleChars ) ] ;
2003-05-15 18:28:41 +00:00
if ( TestBufferSize ( ) ) {
log_err ( " U_COL_SAFECLONE_BUFFERSIZE should be larger than sizeof(UCollator) \n " ) ;
return ;
}
u_uastrcpy ( test1 , " abCda " ) ;
u_uastrcpy ( test2 , " abcda " ) ;
2006-05-21 17:56:44 +00:00
u_uastrcpy ( sampleRule , sampleRuleChars ) ;
2003-05-15 18:28:41 +00:00
/* one default collator & two complex ones */
someCollators [ 0 ] = ucol_open ( " en_US " , & err ) ;
someCollators [ 1 ] = ucol_open ( " ko " , & err ) ;
someCollators [ 2 ] = ucol_open ( " ja_JP " , & err ) ;
2006-05-21 17:56:44 +00:00
someCollators [ 3 ] = ucol_openRules ( sampleRule , - 1 , UCOL_ON , UCOL_TERTIARY , NULL , & err ) ;
2003-05-15 18:28:41 +00:00
if ( U_FAILURE ( err ) ) {
2007-12-07 10:49:34 +00:00
for ( index = 0 ; index < CLONETEST_COLLATOR_COUNT ; index + + ) {
ucol_close ( someCollators [ index ] ) ;
}
2006-05-21 17:56:44 +00:00
log_data_err ( " Couldn't open one or more collators \n " ) ;
return ;
2003-05-15 18:28:41 +00:00
}
/* Check the various error & informational states: */
/* Null status - just returns NULL */
if ( 0 ! = ucol_safeClone ( someCollators [ 0 ] , buffer [ 0 ] , & bufferSize , 0 ) )
{
log_err ( " FAIL: Cloned Collator failed to deal correctly with null status \n " ) ;
}
/* error status - should return 0 & keep error the same */
err = U_MEMORY_ALLOCATION_ERROR ;
if ( 0 ! = ucol_safeClone ( someCollators [ 0 ] , buffer [ 0 ] , & bufferSize , & err ) | | err ! = U_MEMORY_ALLOCATION_ERROR )
{
log_err ( " FAIL: Cloned Collator failed to deal correctly with incoming error status \n " ) ;
}
err = U_ZERO_ERROR ;
/* Null buffer size pointer - just returns NULL & set error to U_ILLEGAL_ARGUMENT_ERROR*/
if ( 0 ! = ucol_safeClone ( someCollators [ 0 ] , buffer [ 0 ] , 0 , & err ) | | err ! = U_ILLEGAL_ARGUMENT_ERROR )
{
log_err ( " FAIL: Cloned Collator failed to deal correctly with null bufferSize pointer \n " ) ;
}
err = U_ZERO_ERROR ;
2003-05-15 16:28:58 +00:00
2003-05-15 18:28:41 +00:00
/* buffer size pointer is 0 - fill in pbufferSize with a size */
bufferSize = 0 ;
if ( 0 ! = ucol_safeClone ( someCollators [ 0 ] , buffer [ 0 ] , & bufferSize , & err ) | | U_FAILURE ( err ) | | bufferSize < = 0 )
{
log_err ( " FAIL: Cloned Collator failed a sizing request ('preflighting') \n " ) ;
}
/* Verify our define is large enough */
if ( U_COL_SAFECLONE_BUFFERSIZE < bufferSize )
{
log_err ( " FAIL: Pre-calculated buffer size is too small \n " ) ;
}
/* Verify we can use this run-time calculated size */
if ( 0 = = ( col = ucol_safeClone ( someCollators [ 0 ] , buffer [ 0 ] , & bufferSize , & err ) ) | | U_FAILURE ( err ) )
{
log_err ( " FAIL: Collator can't be cloned with run-time size \n " ) ;
}
if ( col ) ucol_close ( col ) ;
/* size one byte too small - should allocate & let us know */
- - bufferSize ;
if ( 0 = = ( col = ucol_safeClone ( someCollators [ 0 ] , 0 , & bufferSize , & err ) ) | | err ! = U_SAFECLONE_ALLOCATED_WARNING )
{
log_err ( " FAIL: Cloned Collator failed to deal correctly with too-small buffer size \n " ) ;
}
if ( col ) ucol_close ( col ) ;
err = U_ZERO_ERROR ;
bufferSize = U_COL_SAFECLONE_BUFFERSIZE ;
/* Null buffer pointer - return Collator & set error to U_SAFECLONE_ALLOCATED_ERROR */
if ( 0 = = ( col = ucol_safeClone ( someCollators [ 0 ] , 0 , & bufferSize , & err ) ) | | err ! = U_SAFECLONE_ALLOCATED_WARNING )
{
log_err ( " FAIL: Cloned Collator failed to deal correctly with null buffer pointer \n " ) ;
}
if ( col ) ucol_close ( col ) ;
err = U_ZERO_ERROR ;
/* Null Collator - return NULL & set U_ILLEGAL_ARGUMENT_ERROR */
if ( 0 ! = ucol_safeClone ( 0 , buffer [ 0 ] , & bufferSize , & err ) | | err ! = U_ILLEGAL_ARGUMENT_ERROR )
{
log_err ( " FAIL: Cloned Collator failed to deal correctly with null Collator pointer \n " ) ;
}
err = U_ZERO_ERROR ;
2006-06-05 21:56:14 +00:00
/* Test that a cloned collator doesn't accidentally use UCA. */
col = ucol_open ( " de@collation=phonebook " , & err ) ;
bufferSize = U_COL_SAFECLONE_BUFFERSIZE ;
someClonedCollators [ 0 ] = ucol_safeClone ( col , buffer [ 0 ] , & bufferSize , & err ) ;
doAssert ( ( ucol_greater ( col , umlautUStr , u_strlen ( umlautUStr ) , oeStr , u_strlen ( oeStr ) ) ) , " Original German phonebook collation sorts differently than expected " ) ;
doAssert ( ( ucol_greater ( someClonedCollators [ 0 ] , umlautUStr , u_strlen ( umlautUStr ) , oeStr , u_strlen ( oeStr ) ) ) , " Cloned German phonebook collation sorts differently than expected " ) ;
2006-06-06 00:57:04 +00:00
if ( ! ucol_equals ( someClonedCollators [ 0 ] , col ) ) {
log_err ( " FAIL: Cloned German phonebook collator is not equal to original. \n " ) ;
}
2006-06-05 21:56:14 +00:00
ucol_close ( col ) ;
ucol_close ( someClonedCollators [ 0 ] ) ;
err = U_ZERO_ERROR ;
2003-05-15 18:28:41 +00:00
/* change orig & clone & make sure they are independent */
for ( index = 0 ; index < CLONETEST_COLLATOR_COUNT ; index + + )
{
2006-05-21 21:09:01 +00:00
ucol_setStrength ( someCollators [ index ] , UCOL_IDENTICAL ) ;
bufferSize = 1 ;
err = U_ZERO_ERROR ;
ucol_close ( ucol_safeClone ( someCollators [ index ] , buffer [ index ] , & bufferSize , & err ) ) ;
if ( err ! = U_SAFECLONE_ALLOCATED_WARNING ) {
log_err ( " FAIL: collator number %d was not allocated. \n " , index ) ;
2008-04-04 22:47:43 +00:00
log_err ( " FAIL: status of Collator[%d] is %d (hex: %x). \n " , index , err , err ) ;
2006-05-21 21:09:01 +00:00
}
2003-05-15 18:28:41 +00:00
bufferSize = U_COL_SAFECLONE_BUFFERSIZE ;
2006-05-21 17:56:44 +00:00
err = U_ZERO_ERROR ;
2003-05-15 18:28:41 +00:00
someClonedCollators [ index ] = ucol_safeClone ( someCollators [ index ] , buffer [ index ] , & bufferSize , & err ) ;
2006-05-26 04:00:52 +00:00
if ( someClonedCollators [ index ] = = NULL
| | someClonedCollators [ index ] < ( UCollator * ) buffer [ index ]
| | someClonedCollators [ index ] > ( UCollator * ) ( buffer [ index ] + ( U_COL_SAFECLONE_BUFFERSIZE - 1 ) ) )
{
2006-05-21 17:56:44 +00:00
log_err ( " FAIL: Cloned collator didn't use provided buffer. \n " ) ;
2006-05-26 04:00:52 +00:00
return ;
2006-05-21 17:56:44 +00:00
}
if ( ! ucol_equals ( someClonedCollators [ index ] , someCollators [ index ] ) ) {
log_err ( " FAIL: Cloned collator is not equal to original at index = %d. \n " , index ) ;
}
2003-05-15 18:28:41 +00:00
2006-05-21 17:56:44 +00:00
/* Check the usability */
2003-05-15 18:28:41 +00:00
ucol_setStrength ( someCollators [ index ] , UCOL_PRIMARY ) ;
ucol_setAttribute ( someCollators [ index ] , UCOL_CASE_LEVEL , UCOL_OFF , & err ) ;
2003-05-15 16:28:58 +00:00
2003-05-15 18:28:41 +00:00
doAssert ( ( ucol_equal ( someCollators [ index ] , test1 , u_strlen ( test1 ) , test2 , u_strlen ( test2 ) ) ) , " Result should be \" abcda \" == \" abCda \" " ) ;
1999-08-16 21:50:52 +00:00
2006-05-21 17:56:44 +00:00
/* Close the original to make sure that the clone is usable. */
2003-05-15 18:28:41 +00:00
ucol_close ( someCollators [ index ] ) ;
2006-05-21 17:56:44 +00:00
ucol_setStrength ( someClonedCollators [ index ] , UCOL_TERTIARY ) ;
ucol_setAttribute ( someClonedCollators [ index ] , UCOL_CASE_LEVEL , UCOL_OFF , & err ) ;
doAssert ( ( ucol_greater ( someClonedCollators [ index ] , test1 , u_strlen ( test1 ) , test2 , u_strlen ( test2 ) ) ) , " Result should be \" abCda \" >>> \" abcda \" " ) ;
ucol_close ( someClonedCollators [ index ] ) ;
1999-08-16 21:50:52 +00:00
}
2003-05-15 18:28:41 +00:00
}
2005-06-30 22:45:24 +00:00
void TestCloneBinary ( ) {
UErrorCode err = U_ZERO_ERROR ;
UCollator * col = ucol_open ( " en_US " , & err ) ;
UCollator * c ;
int32_t size ;
uint8_t * buffer ;
if ( U_FAILURE ( err ) ) {
2005-07-01 05:32:06 +00:00
log_data_err ( " Couldn't open collator. Error: %s \n " , u_errorName ( err ) ) ;
return ;
2005-06-30 22:45:24 +00:00
}
size = ucol_cloneBinary ( col , NULL , 0 , & err ) ;
2005-07-07 22:48:45 +00:00
if ( size = = 0 | | err ! = U_BUFFER_OVERFLOW_ERROR ) {
2005-06-30 22:45:24 +00:00
log_err ( " ucol_cloneBinary - couldn't check size. Error: %s \n " , u_errorName ( err ) ) ;
2005-07-01 05:32:06 +00:00
return ;
2005-06-30 22:45:24 +00:00
}
2005-07-06 21:27:21 +00:00
err = U_ZERO_ERROR ;
2005-06-30 22:45:24 +00:00
buffer = ( uint8_t * ) malloc ( size ) ;
ucol_cloneBinary ( col , buffer , size , & err ) ;
if ( U_FAILURE ( err ) ) {
2005-07-01 05:32:06 +00:00
log_err ( " ucol_cloneBinary - couldn't clone.. Error: %s \n " , u_errorName ( err ) ) ;
free ( buffer ) ;
return ;
2005-06-30 22:45:24 +00:00
}
2005-07-01 05:32:06 +00:00
2005-07-14 20:12:29 +00:00
/* how to check binary result ? */
2005-07-01 05:32:06 +00:00
2005-06-30 22:45:24 +00:00
c = ucol_openBinary ( buffer , size , col , & err ) ;
if ( U_FAILURE ( err ) ) {
2005-07-01 05:32:06 +00:00
log_err ( " ucol_openBinary failed. Error: %s \n " , u_errorName ( err ) ) ;
2005-06-30 22:45:24 +00:00
} else {
UChar t [ ] = { 0x41 , 0x42 , 0x43 , 0 } ; /* ABC */
uint8_t * k1 , * k2 ;
int l1 , l2 ;
l1 = ucol_getSortKey ( col , t , - 1 , NULL , 0 ) ;
l2 = ucol_getSortKey ( c , t , - 1 , NULL , 0 ) ;
k1 = ( uint8_t * ) malloc ( sizeof ( uint8_t ) * l1 ) ;
k2 = ( uint8_t * ) malloc ( sizeof ( uint8_t ) * l2 ) ;
ucol_getSortKey ( col , t , - 1 , k1 , l1 ) ;
ucol_getSortKey ( col , t , - 1 , k2 , l2 ) ;
2005-07-06 21:27:21 +00:00
if ( strcmp ( ( char * ) k1 , ( char * ) k2 ) ! = 0 ) {
2005-06-30 22:45:24 +00:00
log_err ( " ucol_openBinary - new collator should equal to old one \n " ) ;
} ;
free ( k1 ) ;
free ( k2 ) ;
}
free ( buffer ) ;
2005-07-14 20:12:29 +00:00
ucol_close ( c ) ;
ucol_close ( col ) ;
2005-06-30 22:45:24 +00:00
}
2008-09-18 23:07:16 +00:00
/*
TestOpenVsOpenRules ensures that collators from ucol_open and ucol_openRules
will generate identical sort keys
*/
void TestOpenVsOpenRules ( ) {
/* create an array of all the locales */
int32_t numLocales = uloc_countAvailable ( ) ;
2008-09-19 00:15:13 +00:00
int32_t sizeOfStdSet ;
uint32_t adder ;
2008-10-01 16:54:07 +00:00
UChar str [ 41 ] ; /* create an array of UChar of size maximum strSize + 1 */
2008-09-19 00:15:13 +00:00
USet * stdSet ;
char * curLoc ;
UCollator * c1 ;
UCollator * c2 ;
const UChar * rules ;
int32_t rulesLength ;
int32_t sortKeyLen1 , sortKeyLen2 ;
uint8_t * sortKey1 = NULL , * sortKey2 = NULL ;
ULocaleData * uld ;
uint32_t x , y , z ;
USet * eSet ;
int32_t eSize ;
int strSize ;
2008-09-18 23:07:16 +00:00
UErrorCode err = U_ZERO_ERROR ;
/* create a set of standard characters that aren't very interesting...
and then we can find some interesting ones later */
2008-09-19 00:15:13 +00:00
stdSet = uset_open ( 0x61 , 0x7A ) ;
2008-09-18 23:07:16 +00:00
uset_addRange ( stdSet , 0x41 , 0x5A ) ;
uset_addRange ( stdSet , 0x30 , 0x39 ) ;
2008-09-19 00:15:13 +00:00
sizeOfStdSet = uset_size ( stdSet ) ;
2008-09-18 23:07:16 +00:00
2008-09-19 00:15:13 +00:00
adder = 1 ;
2008-09-18 23:07:16 +00:00
if ( QUICK )
{
adder = 10 ;
}
for ( x = 0 ; x < numLocales ; x + = adder ) {
2008-09-19 00:15:13 +00:00
curLoc = uloc_getAvailable ( x ) ;
2008-09-18 23:07:16 +00:00
log_verbose ( " Processing %s \n " , curLoc ) ;
/* create a collator the normal API way */
c1 = ucol_open ( curLoc , & err ) ;
if ( U_FAILURE ( err ) ) {
log_err ( " ERROR: Normal collation creation failed with locale: %s : %s \n " , curLoc , myErrorName ( err ) ) ;
return ;
}
/* grab the rules */
rules = ucol_getRules ( c1 , & rulesLength ) ;
/* use those rules to create a collator from rules */
c2 = ucol_openRules ( rules , rulesLength , UCOL_DEFAULT , UCOL_DEFAULT_STRENGTH , NULL , & err ) ;
if ( U_FAILURE ( err ) ) {
log_err ( " ERROR: Creating collator from rules failed with locale: %s : %s \n " , curLoc , myErrorName ( err ) ) ;
return ;
}
2008-09-19 00:15:13 +00:00
uld = ulocdata_open ( curLoc , & err ) ;
2008-09-18 23:07:16 +00:00
/*now that we have some collators, we get several strings */
2008-09-19 00:15:13 +00:00
2008-09-18 23:07:16 +00:00
for ( y = 0 ; y < 5 ; y + + ) {
/* get a set of ALL the characters in this locale */
2008-09-19 00:15:13 +00:00
eSet = ulocdata_getExemplarSet ( uld , NULL , 0 , ULOCDATA_ES_STANDARD , & err ) ;
eSize = uset_size ( eSet ) ;
2008-09-18 23:07:16 +00:00
/* make a string with these characters in it */
2008-09-19 00:15:13 +00:00
strSize = ( rand ( ) % 40 ) + 1 ;
2008-09-18 23:07:16 +00:00
for ( z = 0 ; z < strSize ; z + + ) {
str [ z ] = uset_charAt ( eSet , rand ( ) % eSize ) ;
}
/* change the set to only include 'abnormal' characters (not A-Z, a-z, 0-9 */
uset_removeAll ( eSet , stdSet ) ;
eSize = uset_size ( eSet ) ;
/* if there are some non-normal characters left, put a few into the string, just to make sure we have some */
if ( eSize > 0 ) {
str [ 2 % strSize ] = uset_charAt ( eSet , rand ( ) % eSize ) ;
str [ 3 % strSize ] = uset_charAt ( eSet , rand ( ) % eSize ) ;
str [ 5 % strSize ] = uset_charAt ( eSet , rand ( ) % eSize ) ;
str [ 10 % strSize ] = uset_charAt ( eSet , rand ( ) % eSize ) ;
str [ 13 % strSize ] = uset_charAt ( eSet , rand ( ) % eSize ) ;
}
/* terminate the string */
str [ strSize - 1 ] = ' \0 ' ;
log_verbose ( " String used: %S \n " , str ) ;
/* get sort keys for both of them, and check that the keys are identicle */
sortKeyLen1 = ucol_getSortKey ( c1 , str , u_strlen ( str ) , NULL , 0 ) ;
2008-10-01 16:54:07 +00:00
sortKey1 = ( uint8_t * ) malloc ( sizeof ( uint8_t ) * ( sortKeyLen1 + 1 ) ) ;
2008-09-18 23:07:16 +00:00
/*memset(sortKey1, 0xFE, sortKeyLen1);*/
ucol_getSortKey ( c1 , str , u_strlen ( str ) , sortKey1 , sortKeyLen1 + 1 ) ;
sortKeyLen2 = ucol_getSortKey ( c2 , str , u_strlen ( str ) , NULL , 0 ) ;
2008-10-01 16:54:07 +00:00
sortKey2 = ( uint8_t * ) malloc ( sizeof ( uint8_t ) * ( sortKeyLen2 + 1 ) ) ;
2008-09-18 23:07:16 +00:00
/*memset(sortKey2, 0xFE, sortKeyLen2);*/
ucol_getSortKey ( c2 , str , u_strlen ( str ) , sortKey2 , sortKeyLen2 + 1 ) ;
/* Check that the lengths are the same */
doAssert ( ( sortKeyLen1 = = sortKeyLen2 ) , " Sort key lengths do not match. " ) ;
/* check that the keys are the same */
doAssert ( ( memcmp ( sortKey1 , sortKey2 , sortKeyLen1 ) = = 0 ) , " Keys are not equivalent " ) ;
/* clean up after each string */
2008-10-01 16:54:07 +00:00
free ( sortKey1 ) ;
free ( sortKey2 ) ;
2008-09-18 23:07:16 +00:00
uset_close ( eSet ) ;
}
/* clean up after each locale */
ulocdata_close ( uld ) ;
ucol_close ( c1 ) ;
ucol_close ( c2 ) ;
}
2008-10-01 14:14:13 +00:00
/* final clean up */
uset_close ( stdSet ) ;
2008-09-18 23:07:16 +00:00
}
2003-05-15 18:28:41 +00:00
/*
- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
ctor - - Tests the getSortKey
*/
void TestSortKey ( )
{
uint8_t * sortk1 = NULL , * sortk2 = NULL , * sortk3 = NULL , * sortkEmpty = NULL ;
uint8_t sortk2_compat [ ] = {
2008-04-04 22:47:43 +00:00
/* 3.9 key, from UCA 5.1 */
0x2c , 0x2e , 0x30 , 0x32 , 0x2c , 0x01 ,
0x09 , 0x01 , 0x09 , 0x01 , 0x2b , 0x01 ,
0x92 , 0x93 , 0x94 , 0x95 , 0x92 , 0x0
2006-06-16 05:47:24 +00:00
/* 3.6 key, from UCA 5.0 */
2008-04-04 22:47:43 +00:00
/*
2006-06-16 05:47:24 +00:00
0x29 , 0x2b , 0x2d , 0x2f , 0x29 , 0x01 ,
0x09 , 0x01 , 0x09 , 0x01 , 0x28 , 0x01 ,
0x92 , 0x93 , 0x94 , 0x95 , 0x92 , 0x00
2008-04-04 22:47:43 +00:00
*/
2006-06-16 05:47:24 +00:00
/* 3.4 key, from UCA 4.1 */
/* 0x28, 0x2a, 0x2c, 0x2e, 0x28, 0x01, 0x09, 0x01, 0x09, 0x01, 0x27, 0x01, 0x92, 0x93, 0x94, 0x95, 0x92, 0x00 */
2005-05-19 06:45:10 +00:00
/* 2.6.1 key */
/* 0x26, 0x28, 0x2A, 0x2C, 0x26, 0x01, 0x09, 0x01, 0x09, 0x01, 0x25, 0x01, 0x92, 0x93, 0x94, 0x95, 0x92, 0x00 */
2003-05-15 18:28:41 +00:00
/* 2.2 key */
2003-08-23 01:46:02 +00:00
/*0x1D, 0x1F, 0x21, 0x23, 0x1D, 0x01, 0x09, 0x01, 0x09, 0x01, 0x1C, 0x01, 0x92, 0x93, 0x94, 0x95, 0x92, 0x00*/
2003-05-15 18:28:41 +00:00
/* 2.0 key */
/*0x19, 0x1B, 0x1D, 0x1F, 0x19, 0x01, 0x09, 0x01, 0x09, 0x01, 0x18, 0x01, 0x92, 0x93, 0x94, 0x95, 0x92, 0x00*/
/* 1.8.1 key.*/
/*0x19, 0x1B, 0x1D, 0x1F, 0x19, 0x01, 0x0A, 0x01, 0x0A, 0x01, 0x92, 0x93, 0x94, 0x95, 0x92, 0x00*/
/*this is a 1.8 sortkey */
/*0x17, 0x19, 0x1B, 0x1D, 0x17, 0x01, 0x08, 0x01, 0x08, 0x00*/
/*this is a 1.7 sortkey */
/*0x02, 0x54, 0x02, 0x55, 0x02, 0x56, 0x02, 0x57, 0x02, 0x54, 0x01, 0x02, 0x02, 0x02, 0x02, 0x02, 0x01, 0x02, 0x02, 0x02, 0x02, 0x02, 0x00*/
/* this is a 1.6 sortkey */
/*0x00, 0x53, 0x00, 0x54, 0x00, 0x55, 0x00, 0x56, 0x00, 0x53, 0x00, 0x00, 0x00, 0x01, 0x00, 0x01, 0x00, 0x01, 0x00, 0x01, 0x00, 0x01, 0x00, 0x00, 0x00, 0x01, 0x00, 0x01, 0x00, 0x01, 0x00, 0x01, 0x00, 0x01, 0x00, 0x00*/
} ;
int32_t sortklen , osortklen ;
uint32_t toStringLen = 0 ;
UCollator * col ;
UChar * test1 , * test2 , * test3 ;
UErrorCode status = U_ZERO_ERROR ;
char toStringBuffer [ 256 ] , * resultP ;
uint8_t s1 [ ] = { 0x9f , 0x00 } ;
uint8_t s2 [ ] = { 0x61 , 0x00 } ;
int strcmpResult ;
strcmpResult = strcmp ( ( const char * ) s1 , ( const char * ) s2 ) ;
log_verbose ( " strcmp(0x9f..., 0x61...) = %d \n " , strcmpResult ) ;
if ( strcmpResult < = 0 ) {
log_err ( " ERR: expected strcmp( \" 9f 00 \" , \" 61 00 \" ) to be >=0 (GREATER).. got %d. Calling strcmp() for sortkeys may not work! \n " ,
strcmpResult ) ;
}
log_verbose ( " testing SortKey begins... \n " ) ;
/* this is supposed to open default date format, but later on it treats it like it is "en_US"
- very bad if you try to run the tests on machine where default locale is NOT " en_US " */
/* col = ucol_open(NULL, &status); */
col = ucol_open ( " en_US " , & status ) ;
if ( U_FAILURE ( status ) ) {
log_err ( " ERROR: Default collation creation failed.: %s \n " , myErrorName ( status ) ) ;
return ;
}
if ( ucol_getStrength ( col ) ! = UCOL_DEFAULT_STRENGTH )
{
log_err ( " ERROR: default collation did not have UCOL_DEFAULT_STRENGTH ! \n " ) ;
}
/* Need to use identical strength */
ucol_setAttribute ( col , UCOL_STRENGTH , UCOL_IDENTICAL , & status ) ;
test1 = ( UChar * ) malloc ( sizeof ( UChar ) * 6 ) ;
test2 = ( UChar * ) malloc ( sizeof ( UChar ) * 6 ) ;
test3 = ( UChar * ) malloc ( sizeof ( UChar ) * 6 ) ;
memset ( test1 , 0xFE , sizeof ( UChar ) * 6 ) ;
memset ( test2 , 0xFE , sizeof ( UChar ) * 6 ) ;
memset ( test3 , 0xFE , sizeof ( UChar ) * 6 ) ;
u_uastrcpy ( test1 , " Abcda " ) ;
u_uastrcpy ( test2 , " abcda " ) ;
u_uastrcpy ( test3 , " abcda " ) ;
log_verbose ( " Use tertiary comparison level testing .... \n " ) ;
sortklen = ucol_getSortKey ( col , test1 , u_strlen ( test1 ) , NULL , 0 ) ;
sortk1 = ( uint8_t * ) malloc ( sizeof ( uint8_t ) * ( sortklen + 1 ) ) ;
memset ( sortk1 , 0xFE , sortklen ) ;
ucol_getSortKey ( col , test1 , u_strlen ( test1 ) , sortk1 , sortklen + 1 ) ;
sortklen = ucol_getSortKey ( col , test2 , u_strlen ( test2 ) , NULL , 0 ) ;
sortk2 = ( uint8_t * ) malloc ( sizeof ( uint8_t ) * ( sortklen + 1 ) ) ;
memset ( sortk2 , 0xFE , sortklen ) ;
ucol_getSortKey ( col , test2 , u_strlen ( test2 ) , sortk2 , sortklen + 1 ) ;
osortklen = sortklen ;
sortklen = ucol_getSortKey ( col , test2 , u_strlen ( test3 ) , NULL , 0 ) ;
sortk3 = ( uint8_t * ) malloc ( sizeof ( uint8_t ) * ( sortklen + 1 ) ) ;
memset ( sortk3 , 0xFE , sortklen ) ;
ucol_getSortKey ( col , test2 , u_strlen ( test2 ) , sortk3 , sortklen + 1 ) ;
doAssert ( ( sortklen = = osortklen ) , " Sortkey length should be the same (abcda, abcda) " ) ;
doAssert ( ( memcmp ( sortk1 , sortk2 , sortklen ) > 0 ) , " Result should be \" Abcda \" > \" abcda \" " ) ;
doAssert ( ( memcmp ( sortk2 , sortk1 , sortklen ) < 0 ) , " Result should be \" abcda \" < \" Abcda \" " ) ;
doAssert ( ( memcmp ( sortk2 , sortk3 , sortklen ) = = 0 ) , " Result should be \" abcda \" == \" abcda \" " ) ;
doAssert ( ( memcmp ( sortk2 , sortk2_compat , sortklen ) = = 0 ) , " Binary format for 'abcda' sortkey different! " ) ;
resultP = ucol_sortKeyToString ( col , sortk2_compat , toStringBuffer , & toStringLen ) ;
doAssert ( ( resultP ! = 0 ) , " sortKeyToString failed! " ) ;
# if 1 /* verobse log of sortkeys */
{
char junk2 [ 1000 ] ;
char junk3 [ 1000 ] ;
int i ;
strcpy ( junk2 , " abcda[2] " ) ;
strcpy ( junk3 , " abcda[3] " ) ;
for ( i = 0 ; i < sortklen ; i + + )
2003-05-15 16:28:58 +00:00
{
2003-05-15 18:28:41 +00:00
sprintf ( junk2 + strlen ( junk2 ) , " %02X " , ( int ) ( 0xFF & sortk2 [ i ] ) ) ;
sprintf ( junk3 + strlen ( junk3 ) , " %02X " , ( int ) ( 0xFF & sortk3 [ i ] ) ) ;
2003-05-15 16:28:58 +00:00
}
2003-05-15 18:28:41 +00:00
log_verbose ( " %s \n " , junk2 ) ;
log_verbose ( " %s \n " , junk3 ) ;
}
# endif
free ( sortk1 ) ;
free ( sortk2 ) ;
free ( sortk3 ) ;
log_verbose ( " Use secondary comparision level testing ... \n " ) ;
ucol_setStrength ( col , UCOL_SECONDARY ) ;
sortklen = ucol_getSortKey ( col , test1 , u_strlen ( test1 ) , NULL , 0 ) ;
sortk1 = ( uint8_t * ) malloc ( sizeof ( uint8_t ) * ( sortklen + 1 ) ) ;
ucol_getSortKey ( col , test1 , u_strlen ( test1 ) , sortk1 , sortklen + 1 ) ;
sortklen = ucol_getSortKey ( col , test2 , u_strlen ( test2 ) , NULL , 0 ) ;
sortk2 = ( uint8_t * ) malloc ( sizeof ( uint8_t ) * ( sortklen + 1 ) ) ;
ucol_getSortKey ( col , test2 , u_strlen ( test2 ) , sortk2 , sortklen + 1 ) ;
doAssert ( ! ( memcmp ( sortk1 , sortk2 , sortklen ) > 0 ) , " Result should be \" Abcda \" == \" abcda \" " ) ;
doAssert ( ! ( memcmp ( sortk2 , sortk1 , sortklen ) < 0 ) , " Result should be \" abcda \" == \" Abcda \" " ) ;
doAssert ( ( memcmp ( sortk1 , sortk2 , sortklen ) = = 0 ) , " Result should be \" abcda \" == \" abcda \" " ) ;
log_verbose ( " getting sortkey for an empty string \n " ) ;
ucol_setAttribute ( col , UCOL_STRENGTH , UCOL_TERTIARY , & status ) ;
sortklen = ucol_getSortKey ( col , test1 , 0 , NULL , 0 ) ;
sortkEmpty = ( uint8_t * ) malloc ( sizeof ( uint8_t ) * sortklen + 1 ) ;
sortklen = ucol_getSortKey ( col , test1 , 0 , sortkEmpty , sortklen + 1 ) ;
if ( sortklen ! = 3 | | sortkEmpty [ 0 ] ! = 1 | | sortkEmpty [ 0 ] ! = 1 | | sortkEmpty [ 2 ] ! = 0 ) {
log_err ( " Empty string generated wrong sortkey! \n " ) ;
}
free ( sortkEmpty ) ;
log_verbose ( " testing passing invalid string \n " ) ;
sortklen = ucol_getSortKey ( col , NULL , 0 , NULL , 0 ) ;
if ( sortklen ! = 0 ) {
log_err ( " Invalid string didn't return sortkey size of 0 \n " ) ;
}
2003-05-15 16:28:58 +00:00
2003-05-15 18:28:41 +00:00
log_verbose ( " testing sortkey ends... \n " ) ;
ucol_close ( col ) ;
free ( test1 ) ;
free ( test2 ) ;
free ( test3 ) ;
free ( sortk1 ) ;
free ( sortk2 ) ;
}
void TestHashCode ( )
{
uint8_t * sortk1 , * sortk2 , * sortk3 ;
int32_t sortk1len , sortk2len , sortk3len ;
UCollator * col ;
UChar * test1 , * test2 , * test3 ;
UErrorCode status = U_ZERO_ERROR ;
log_verbose ( " testing getHashCode begins... \n " ) ;
col = ucol_open ( " en_US " , & status ) ;
if ( U_FAILURE ( status ) ) {
log_err ( " ERROR: Default collation creation failed.: %s \n " , myErrorName ( status ) ) ;
return ;
}
test1 = ( UChar * ) malloc ( sizeof ( UChar ) * 6 ) ;
test2 = ( UChar * ) malloc ( sizeof ( UChar ) * 6 ) ;
test3 = ( UChar * ) malloc ( sizeof ( UChar ) * 6 ) ;
u_uastrcpy ( test1 , " Abcda " ) ;
u_uastrcpy ( test2 , " abcda " ) ;
u_uastrcpy ( test3 , " abcda " ) ;
log_verbose ( " Use tertiary comparison level testing .... \n " ) ;
sortk1len = ucol_getSortKey ( col , test1 , u_strlen ( test1 ) , NULL , 0 ) ;
sortk1 = ( uint8_t * ) malloc ( sizeof ( uint8_t ) * ( sortk1len + 1 ) ) ;
ucol_getSortKey ( col , test1 , u_strlen ( test1 ) , sortk1 , sortk1len + 1 ) ;
sortk2len = ucol_getSortKey ( col , test2 , u_strlen ( test2 ) , NULL , 0 ) ;
sortk2 = ( uint8_t * ) malloc ( sizeof ( uint8_t ) * ( sortk2len + 1 ) ) ;
ucol_getSortKey ( col , test2 , u_strlen ( test2 ) , sortk2 , sortk2len + 1 ) ;
sortk3len = ucol_getSortKey ( col , test2 , u_strlen ( test3 ) , NULL , 0 ) ;
sortk3 = ( uint8_t * ) malloc ( sizeof ( uint8_t ) * ( sortk3len + 1 ) ) ;
ucol_getSortKey ( col , test2 , u_strlen ( test2 ) , sortk3 , sortk3len + 1 ) ;
2003-05-15 16:28:58 +00:00
2003-05-15 18:28:41 +00:00
log_verbose ( " ucol_hashCode() testing ... \n " ) ;
doAssert ( ucol_keyHashCode ( sortk1 , sortk1len ) ! = ucol_keyHashCode ( sortk2 , sortk2len ) , " Hash test1 result incorrect " ) ;
doAssert ( ! ( ucol_keyHashCode ( sortk1 , sortk1len ) = = ucol_keyHashCode ( sortk2 , sortk2len ) ) , " Hash test2 result incorrect " ) ;
doAssert ( ucol_keyHashCode ( sortk2 , sortk2len ) = = ucol_keyHashCode ( sortk3 , sortk3len ) , " Hash result not equal " ) ;
log_verbose ( " hashCode tests end. \n " ) ;
ucol_close ( col ) ;
free ( sortk1 ) ;
free ( sortk2 ) ;
free ( sortk3 ) ;
free ( test1 ) ;
free ( test2 ) ;
free ( test3 ) ;
}
/*
* - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
* Tests the UCollatorElements API .
*
*/
void TestElemIter ( )
{
int32_t offset ;
int32_t order1 , order2 , order3 ;
UChar * testString1 , * testString2 ;
UCollator * col ;
UCollationElements * iterator1 , * iterator2 , * iterator3 ;
UErrorCode status = U_ZERO_ERROR ;
log_verbose ( " testing UCollatorElements begins... \n " ) ;
col = ucol_open ( " en_US " , & status ) ;
ucol_setAttribute ( col , UCOL_NORMALIZATION_MODE , UCOL_OFF , & status ) ;
if ( U_FAILURE ( status ) ) {
log_err ( " ERROR: Default collation creation failed.: %s \n " , myErrorName ( status ) ) ;
return ;
}
testString1 = ( UChar * ) malloc ( sizeof ( UChar ) * 150 ) ;
testString2 = ( UChar * ) malloc ( sizeof ( UChar ) * 150 ) ;
u_uastrcpy ( testString1 , " XFILE What subset of all possible test cases has the highest probability of detecting the most errors? " ) ;
u_uastrcpy ( testString2 , " Xf_ile What subset of all possible test cases has the lowest probability of detecting the least errors? " ) ;
2003-05-15 16:28:58 +00:00
2003-05-15 18:28:41 +00:00
log_verbose ( " Constructors and comparison testing.... \n " ) ;
2003-05-15 16:28:58 +00:00
2003-05-15 18:28:41 +00:00
iterator1 = ucol_openElements ( col , testString1 , u_strlen ( testString1 ) , & status ) ;
if ( U_FAILURE ( status ) ) {
log_err ( " ERROR: Default collationElement iterator creation failed.: %s \n " , myErrorName ( status ) ) ;
1999-08-16 21:50:52 +00:00
ucol_close ( col ) ;
2003-05-15 18:28:41 +00:00
return ;
}
else { log_verbose ( " PASS: Default collationElement iterator1 creation passed \n " ) ; }
iterator2 = ucol_openElements ( col , testString1 , u_strlen ( testString1 ) , & status ) ;
if ( U_FAILURE ( status ) ) {
log_err ( " ERROR: Default collationElement iterator creation failed.: %s \n " , myErrorName ( status ) ) ;
1999-08-16 21:50:52 +00:00
ucol_close ( col ) ;
2003-05-15 18:28:41 +00:00
return ;
1999-08-16 21:50:52 +00:00
}
2003-05-15 18:28:41 +00:00
else { log_verbose ( " PASS: Default collationElement iterator2 creation passed \n " ) ; }
iterator3 = ucol_openElements ( col , testString2 , u_strlen ( testString2 ) , & status ) ;
if ( U_FAILURE ( status ) ) {
log_err ( " ERROR: Default collationElement iterator creation failed.: %s \n " , myErrorName ( status ) ) ;
1999-08-16 21:50:52 +00:00
ucol_close ( col ) ;
2003-05-15 18:28:41 +00:00
return ;
}
else { log_verbose ( " PASS: Default collationElement iterator3 creation passed \n " ) ; }
offset = ucol_getOffset ( iterator1 ) ;
ucol_setOffset ( iterator1 , 6 , & status ) ;
if ( U_FAILURE ( status ) ) {
log_err ( " Error in setOffset for UCollatorElements iterator.: %s \n " , myErrorName ( status ) ) ;
return ;
}
if ( ucol_getOffset ( iterator1 ) = = 6 )
log_verbose ( " setOffset and getOffset working fine \n " ) ;
else {
log_err ( " error in set and get Offset got %d instead of 6 \n " , ucol_getOffset ( iterator1 ) ) ;
}
ucol_setOffset ( iterator1 , 0 , & status ) ;
order1 = ucol_next ( iterator1 , & status ) ;
if ( U_FAILURE ( status ) ) {
log_err ( " Somehow ran out of memory stepping through the iterator1.: %s \n " , myErrorName ( status ) ) ;
return ;
}
order2 = ucol_getOffset ( iterator2 ) ;
doAssert ( ( order1 ! = order2 ) , " The first iterator advance failed " ) ;
order2 = ucol_next ( iterator2 , & status ) ;
if ( U_FAILURE ( status ) ) {
log_err ( " Somehow ran out of memory stepping through the iterator2.: %s \n " , myErrorName ( status ) ) ;
return ;
}
order3 = ucol_next ( iterator3 , & status ) ;
if ( U_FAILURE ( status ) ) {
log_err ( " Somehow ran out of memory stepping through the iterator3.: %s \n " , myErrorName ( status ) ) ;
return ;
1999-08-16 21:50:52 +00:00
}
2003-05-15 18:28:41 +00:00
doAssert ( ( order1 = = order2 ) , " The second iterator advance failed should be the same as first one " ) ;
2003-05-15 16:28:58 +00:00
2003-05-15 18:28:41 +00:00
doAssert ( ( ucol_primaryOrder ( order1 ) = = ucol_primaryOrder ( order3 ) ) , " The primary orders should be identical " ) ;
doAssert ( ( ucol_secondaryOrder ( order1 ) = = ucol_secondaryOrder ( order3 ) ) , " The secondary orders should be identical " ) ;
doAssert ( ( ucol_tertiaryOrder ( order1 ) = = ucol_tertiaryOrder ( order3 ) ) , " The tertiary orders should be identical " ) ;
2003-05-15 16:28:58 +00:00
2003-05-15 18:28:41 +00:00
order1 = ucol_next ( iterator1 , & status ) ;
if ( U_FAILURE ( status ) ) {
log_err ( " Somehow ran out of memory stepping through the iterator2.: %s \n " , myErrorName ( status ) ) ;
return ;
}
order3 = ucol_next ( iterator3 , & status ) ;
if ( U_FAILURE ( status ) ) {
log_err ( " Somehow ran out of memory stepping through the iterator2.: %s \n " , myErrorName ( status ) ) ;
return ;
}
doAssert ( ( ucol_primaryOrder ( order1 ) = = ucol_primaryOrder ( order3 ) ) , " The primary orders should be identical " ) ;
doAssert ( ( ucol_tertiaryOrder ( order1 ) ! = ucol_tertiaryOrder ( order3 ) ) , " The tertiary orders should be different " ) ;
2003-05-15 16:28:58 +00:00
2003-05-15 18:28:41 +00:00
order1 = ucol_next ( iterator1 , & status ) ;
if ( U_FAILURE ( status ) ) {
log_err ( " Somehow ran out of memory stepping through the iterator2.: %s \n " , myErrorName ( status ) ) ;
return ;
}
order3 = ucol_next ( iterator3 , & status ) ;
if ( U_FAILURE ( status ) ) {
log_err ( " Somehow ran out of memory stepping through the iterator2.: %s \n " , myErrorName ( status ) ) ;
return ;
}
/* this here, my friends, is either pure lunacy or something so obsolete that even it's mother
* doesn ' t care about it . Essentialy , this test complains if secondary values for ' I ' and ' _ '
* are the same . According to the UCA , this is not true . Therefore , remove the test .
* Besides , if primary strengths for two code points are different , it doesn ' t matter one bit
* what is the relation between secondary or any other strengths .
* killed by weiv 06 / 11 / 2002.
*/
/*
doAssert ( ( ( order1 & UCOL_SECONDARYMASK ) ! = ( order3 & UCOL_SECONDARYMASK ) ) , " The secondary orders should be different " ) ;
*/
doAssert ( ( order1 ! = UCOL_NULLORDER ) , " Unexpected end of iterator reached " ) ;
free ( testString1 ) ;
free ( testString2 ) ;
ucol_closeElements ( iterator1 ) ;
ucol_closeElements ( iterator2 ) ;
ucol_closeElements ( iterator3 ) ;
ucol_close ( col ) ;
log_verbose ( " testing CollationElementIterator ends... \n " ) ;
}
void TestGetLocale ( ) {
UErrorCode status = U_ZERO_ERROR ;
const char * rules = " &a<x<y<z " ;
UChar rlz [ 256 ] = { 0 } ;
uint32_t rlzLen = u_unescape ( rules , rlz , 256 ) ;
UCollator * coll = NULL ;
const char * locale = NULL ;
int32_t i = 0 ;
2004-04-16 21:31:41 +00:00
/* Now that the collation tree is separate, actual==valid at all times. [alan] */
2003-05-15 18:28:41 +00:00
static const struct {
const char * requestedLocale ;
const char * validLocale ;
const char * actualLocale ;
} testStruct [ ] = {
2007-03-09 07:14:25 +00:00
{ " sr_RS " , " sr_Cyrl_RS " , " ru " } ,
2007-06-22 23:57:38 +00:00
{ " sh_YU " , " sr_Latn_RS " , " hr " } , /* this used to be sh, but now sh collation aliases hr */
2004-04-16 21:31:41 +00:00
{ " en_BE_FOO " , " en_BE " , " en_BE " } ,
2004-11-05 22:50:08 +00:00
{ " fr_FR_NONEXISTANT " , " fr_FR " , " fr " }
2003-05-15 18:28:41 +00:00
} ;
/* test opening collators for different locales */
for ( i = 0 ; i < sizeof ( testStruct ) / sizeof ( testStruct [ 0 ] ) ; i + + ) {
status = U_ZERO_ERROR ;
coll = ucol_open ( testStruct [ i ] . requestedLocale , & status ) ;
if ( U_FAILURE ( status ) ) {
log_err ( " Failed to open collator for %s with %s \n " , testStruct [ i ] . requestedLocale , u_errorName ( status ) ) ;
2003-05-15 16:28:58 +00:00
ucol_close ( coll ) ;
2003-05-15 18:28:41 +00:00
continue ;
2002-08-02 06:55:51 +00:00
}
2006-10-27 17:55:54 +00:00
locale = ucol_getLocale ( coll , ULOC_REQUESTED_LOCALE , & status ) ;
2003-05-15 18:28:41 +00:00
if ( strcmp ( locale , testStruct [ i ] . requestedLocale ) ! = 0 ) {
log_err ( " [Coll %s]: Error in requested locale, expected %s, got %s \n " , testStruct [ i ] . requestedLocale , testStruct [ i ] . requestedLocale , locale ) ;
2002-08-21 19:09:33 +00:00
}
2003-05-15 18:28:41 +00:00
locale = ucol_getLocale ( coll , ULOC_VALID_LOCALE , & status ) ;
if ( strcmp ( locale , testStruct [ i ] . validLocale ) ! = 0 ) {
log_err ( " [Coll %s]: Error in valid locale, expected %s, got %s \n " , testStruct [ i ] . requestedLocale , testStruct [ i ] . validLocale , locale ) ;
2002-08-21 19:09:33 +00:00
}
2003-05-15 18:28:41 +00:00
locale = ucol_getLocale ( coll , ULOC_ACTUAL_LOCALE , & status ) ;
if ( strcmp ( locale , testStruct [ i ] . actualLocale ) ! = 0 ) {
log_err ( " [Coll %s]: Error in actual locale, expected %s, got %s \n " , testStruct [ i ] . requestedLocale , testStruct [ i ] . actualLocale , locale ) ;
}
ucol_close ( coll ) ;
}
/* completely non-existant locale for collator should get a default collator */
{
UCollator * defaultColl = ucol_open ( NULL , & status ) ;
coll = ucol_open ( " blahaha " , & status ) ;
2003-06-04 06:53:23 +00:00
if ( U_SUCCESS ( status ) ) {
if ( strcmp ( ucol_getLocale ( coll , ULOC_REQUESTED_LOCALE , & status ) , " blahaha " ) ) {
log_err ( " Nonexisting locale didn't preserve the requested locale \n " ) ;
}
if ( strcmp ( ucol_getLocale ( coll , ULOC_VALID_LOCALE , & status ) ,
ucol_getLocale ( defaultColl , ULOC_VALID_LOCALE , & status ) ) ) {
log_err ( " Valid locale for nonexisting locale locale collator differs "
" from valid locale for default collator \n " ) ;
}
if ( strcmp ( ucol_getLocale ( coll , ULOC_ACTUAL_LOCALE , & status ) ,
ucol_getLocale ( defaultColl , ULOC_ACTUAL_LOCALE , & status ) ) ) {
log_err ( " Actual locale for nonexisting locale locale collator differs "
" from actual locale for default collator \n " ) ;
}
ucol_close ( coll ) ;
ucol_close ( defaultColl ) ;
} else {
log_data_err ( " Couldn't open collators \n " ) ;
2003-05-15 18:28:41 +00:00
}
}
/* collator instantiated from rules should have all three locales NULL */
coll = ucol_openRules ( rlz , rlzLen , UCOL_DEFAULT , UCOL_DEFAULT , NULL , & status ) ;
locale = ucol_getLocale ( coll , ULOC_REQUESTED_LOCALE , & status ) ;
if ( locale ! = NULL ) {
log_err ( " For collator instantiated from rules, requested locale returned %s instead of NULL \n " , locale ) ;
}
locale = ucol_getLocale ( coll , ULOC_VALID_LOCALE , & status ) ;
if ( locale ! = NULL ) {
log_err ( " For collator instantiated from rules, valid locale returned %s instead of NULL \n " , locale ) ;
}
locale = ucol_getLocale ( coll , ULOC_ACTUAL_LOCALE , & status ) ;
if ( locale ! = NULL ) {
log_err ( " For collator instantiated from rules, actual locale returned %s instead of NULL \n " , locale ) ;
}
ucol_close ( coll ) ;
}
void TestGetAll ( )
{
int32_t i , count ;
count = ucol_countAvailable ( ) ;
/* use something sensible w/o hardcoding the count */
if ( count < 0 ) {
log_err ( " Error in countAvailable(), it returned %d \n " , count ) ;
}
else {
log_verbose ( " PASS: countAvailable() successful, it returned %d \n " , count ) ;
}
for ( i = 0 ; i < count ; i + + )
log_verbose ( " %s \n " , ucol_getAvailable ( i ) ) ;
}
struct teststruct {
const char * original ;
uint8_t key [ 256 ] ;
2006-09-28 08:41:37 +00:00
} ;
2003-05-15 18:28:41 +00:00
static int compare_teststruct ( const void * string1 , const void * string2 ) {
2006-09-28 08:41:37 +00:00
return ( strcmp ( ( const char * ) ( ( struct teststruct * ) string1 ) - > key , ( const char * ) ( ( struct teststruct * ) string2 ) - > key ) ) ;
2003-05-15 18:28:41 +00:00
}
void TestBounds ( ) {
2006-09-28 08:41:37 +00:00
UErrorCode status = U_ZERO_ERROR ;
2003-05-15 18:28:41 +00:00
2006-09-28 08:41:37 +00:00
UCollator * coll = ucol_open ( " sh " , & status ) ;
2003-05-15 18:28:41 +00:00
2006-09-28 08:41:37 +00:00
uint8_t sortkey [ 512 ] , lower [ 512 ] , upper [ 512 ] ;
UChar buffer [ 512 ] ;
2003-05-15 18:28:41 +00:00
2006-09-28 08:41:37 +00:00
static const char * const test [ ] = {
" John Smith " ,
" JOHN SMITH " ,
" john SMITH " ,
" j \\ u00F6hn sm \\ u00EFth " ,
" J \\ u00F6hn Sm \\ u00EFth " ,
" J \\ u00D6HN SM \\ u00CFTH " ,
" john smithsonian " ,
" John Smithsonian " ,
} ;
2003-05-15 18:28:41 +00:00
2006-09-28 08:41:37 +00:00
struct teststruct tests [ ] = {
{ " \\ u010CAKI MIHALJ " } ,
{ " \\ u010CAKI MIHALJ " } ,
{ " \\ u010CAKI PIRO \\ u0160KA " } ,
{ " \\ u010CABAI ANDRIJA " } ,
{ " \\ u010CABAI LAJO \\ u0160 " } ,
{ " \\ u010CABAI MARIJA " } ,
{ " \\ u010CABAI STEVAN " } ,
{ " \\ u010CABAI STEVAN " } ,
{ " \\ u010CABARKAPA BRANKO " } ,
{ " \\ u010CABARKAPA MILENKO " } ,
{ " \\ u010CABARKAPA MIROSLAV " } ,
{ " \\ u010CABARKAPA SIMO " } ,
{ " \\ u010CABARKAPA STANKO " } ,
{ " \\ u010CABARKAPA TAMARA " } ,
{ " \\ u010CABARKAPA TOMA \\ u0160 " } ,
{ " \\ u010CABDARI \\ u0106 NIKOLA " } ,
{ " \\ u010CABDARI \\ u0106 ZORICA " } ,
{ " \\ u010CABI NANDOR " } ,
{ " \\ u010CABOVI \\ u0106 MILAN " } ,
{ " \\ u010CABRADI AGNEZIJA " } ,
{ " \\ u010CABRADI IVAN " } ,
{ " \\ u010CABRADI JELENA " } ,
{ " \\ u010CABRADI LJUBICA " } ,
{ " \\ u010CABRADI STEVAN " } ,
{ " \\ u010CABRDA MARTIN " } ,
{ " \\ u010CABRILO BOGDAN " } ,
{ " \\ u010CABRILO BRANISLAV " } ,
{ " \\ u010CABRILO LAZAR " } ,
{ " \\ u010CABRILO LJUBICA " } ,
{ " \\ u010CABRILO SPASOJA " } ,
{ " \\ u010CADE \\ u0160 ZDENKA " } ,
{ " \\ u010CADESKI BLAGOJE " } ,
{ " \\ u010CADOVSKI VLADIMIR " } ,
{ " \\ u010CAGLJEVI \\ u0106 TOMA " } ,
{ " \\ u010CAGOROVI \\ u0106 VLADIMIR " } ,
{ " \\ u010CAJA VANKA " } ,
{ " \\ u010CAJI \\ u0106 BOGOLJUB " } ,
{ " \\ u010CAJI \\ u0106 BORISLAV " } ,
{ " \\ u010CAJI \\ u0106 RADOSLAV " } ,
{ " \\ u010CAK \\ u0160IRAN MILADIN " } ,
{ " \\ u010CAKAN EUGEN " } ,
{ " \\ u010CAKAN EVGENIJE " } ,
{ " \\ u010CAKAN IVAN " } ,
{ " \\ u010CAKAN JULIJAN " } ,
{ " \\ u010CAKAN MIHAJLO " } ,
{ " \\ u010CAKAN STEVAN " } ,
{ " \\ u010CAKAN VLADIMIR " } ,
{ " \\ u010CAKAN VLADIMIR " } ,
{ " \\ u010CAKAN VLADIMIR " } ,
{ " \\ u010CAKARA ANA " } ,
{ " \\ u010CAKAREVI \\ u0106 MOMIR " } ,
{ " \\ u010CAKAREVI \\ u0106 NEDELJKO " } ,
{ " \\ u010CAKI \\ u0160ANDOR " } ,
{ " \\ u010CAKI AMALIJA " } ,
{ " \\ u010CAKI ANDRA \\ u0160 " } ,
{ " \\ u010CAKI LADISLAV " } ,
{ " \\ u010CAKI LAJO \\ u0160 " } ,
{ " \\ u010CAKI LASLO " } ,
} ;
2003-05-15 18:28:41 +00:00
2003-06-04 06:53:23 +00:00
2006-09-28 08:41:37 +00:00
int32_t i = 0 , j = 0 , k = 0 , buffSize = 0 , skSize = 0 , lowerSize = 0 , upperSize = 0 ;
int32_t arraySize = sizeof ( tests ) / sizeof ( tests [ 0 ] ) ;
2003-06-04 06:53:23 +00:00
2006-09-28 08:41:37 +00:00
if ( U_SUCCESS ( status ) & & coll ) {
for ( i = 0 ; i < arraySize ; i + + ) {
buffSize = u_unescape ( tests [ i ] . original , buffer , 512 ) ;
skSize = ucol_getSortKey ( coll , buffer , buffSize , tests [ i ] . key , 512 ) ;
2002-09-17 06:27:51 +00:00
}
2003-05-15 18:28:41 +00:00
2006-09-28 08:41:37 +00:00
qsort ( tests , arraySize , sizeof ( struct teststruct ) , compare_teststruct ) ;
for ( i = 0 ; i < arraySize - 1 ; i + + ) {
for ( j = i + 1 ; j < arraySize ; j + + ) {
lowerSize = ucol_getBound ( tests [ i ] . key , - 1 , UCOL_BOUND_LOWER , 1 , lower , 512 , & status ) ;
upperSize = ucol_getBound ( tests [ j ] . key , - 1 , UCOL_BOUND_UPPER , 1 , upper , 512 , & status ) ;
for ( k = i ; k < = j ; k + + ) {
if ( strcmp ( ( const char * ) lower , ( const char * ) tests [ k ] . key ) > 0 ) {
log_err ( " Problem with lower! j = %i (%s vs %s) \n " , k , tests [ k ] . original , tests [ i ] . original ) ;
}
if ( strcmp ( ( const char * ) upper , ( const char * ) tests [ k ] . key ) < = 0 ) {
log_err ( " Problem with upper! j = %i (%s vs %s) \n " , k , tests [ k ] . original , tests [ j ] . original ) ;
}
}
}
}
2003-05-15 18:28:41 +00:00
2006-09-28 08:41:37 +00:00
#if 0
for ( i = 0 ; i < 1000 ; i + + ) {
lowerRND = ( rand ( ) / ( RAND_MAX / arraySize ) ) ;
upperRND = lowerRND + ( rand ( ) / ( RAND_MAX / ( arraySize - lowerRND ) ) ) ;
lowerSize = ucol_getBound ( tests [ lowerRND ] . key , - 1 , UCOL_BOUND_LOWER , 1 , lower , 512 , & status ) ;
upperSize = ucol_getBound ( tests [ upperRND ] . key , - 1 , UCOL_BOUND_UPPER_LONG , 1 , upper , 512 , & status ) ;
for ( j = lowerRND ; j < = upperRND ; j + + ) {
if ( strcmp ( lower , tests [ j ] . key ) > 0 ) {
log_err ( " Problem with lower! j = %i (%s vs %s) \n " , j , tests [ j ] . original , tests [ lowerRND ] . original ) ;
}
if ( strcmp ( upper , tests [ j ] . key ) < = 0 ) {
log_err ( " Problem with upper! j = %i (%s vs %s) \n " , j , tests [ j ] . original , tests [ upperRND ] . original ) ;
}
}
}
2003-05-15 18:28:41 +00:00
# endif
2006-09-28 08:41:37 +00:00
for ( i = 0 ; i < sizeof ( test ) / sizeof ( test [ 0 ] ) ; i + + ) {
buffSize = u_unescape ( test [ i ] , buffer , 512 ) ;
skSize = ucol_getSortKey ( coll , buffer , buffSize , sortkey , 512 ) ;
lowerSize = ucol_getBound ( sortkey , skSize , UCOL_BOUND_LOWER , 1 , lower , 512 , & status ) ;
upperSize = ucol_getBound ( sortkey , skSize , UCOL_BOUND_UPPER_LONG , 1 , upper , 512 , & status ) ;
for ( j = i + 1 ; j < sizeof ( test ) / sizeof ( test [ 0 ] ) ; j + + ) {
buffSize = u_unescape ( test [ j ] , buffer , 512 ) ;
skSize = ucol_getSortKey ( coll , buffer , buffSize , sortkey , 512 ) ;
if ( strcmp ( ( const char * ) lower , ( const char * ) sortkey ) > 0 ) {
log_err ( " Problem with lower! i = %i, j = %i (%s vs %s) \n " , i , j , test [ i ] , test [ j ] ) ;
}
if ( strcmp ( ( const char * ) upper , ( const char * ) sortkey ) < = 0 ) {
log_err ( " Problem with upper! i = %i, j = %i (%s vs %s) \n " , i , j , test [ i ] , test [ j ] ) ;
}
}
2003-06-04 06:53:23 +00:00
}
2006-09-28 08:41:37 +00:00
ucol_close ( coll ) ;
} else {
log_data_err ( " Couldn't open collator \n " ) ;
2003-05-09 20:10:44 +00:00
}
2003-06-04 06:53:23 +00:00
2003-05-15 18:28:41 +00:00
}
static void doOverrunTest ( UCollator * coll , const UChar * uString , int32_t strLen ) {
2006-09-28 08:41:37 +00:00
int32_t skLen = 0 , skLen2 = 0 ;
uint8_t sortKey [ 256 ] ;
int32_t i , j ;
uint8_t filler = 0xFF ;
skLen = ucol_getSortKey ( coll , uString , strLen , NULL , 0 ) ;
for ( i = 0 ; i < skLen ; i + + ) {
memset ( sortKey , filler , 256 ) ;
skLen2 = ucol_getSortKey ( coll , uString , strLen , sortKey , i ) ;
if ( skLen ! = skLen2 ) {
log_err ( " For buffer size %i, got different sortkey length. Expected %i got %i \n " , i , skLen , skLen2 ) ;
}
for ( j = i ; j < 256 ; j + + ) {
if ( sortKey [ j ] ! = filler ) {
log_err ( " Something run over index %i \n " , j ) ;
break ;
}
}
2003-05-09 20:10:44 +00:00
}
2003-05-15 18:28:41 +00:00
}
/* j1865 reports that if a shorter buffer is passed to
2006-09-28 08:41:37 +00:00
* to get sort key , a buffer overrun happens in some
* cases . This test tries to check this .
*/
2003-05-15 18:28:41 +00:00
void TestSortKeyBufferOverrun ( void ) {
2006-09-28 08:41:37 +00:00
UErrorCode status = U_ZERO_ERROR ;
const char * cString = " A very Merry liTTle-lamB.. " ;
UChar uString [ 256 ] ;
int32_t strLen = 0 ;
UCollator * coll = ucol_open ( " root " , & status ) ;
strLen = u_unescape ( cString , uString , 256 ) ;
2003-05-15 18:28:41 +00:00
2006-09-28 08:41:37 +00:00
if ( U_SUCCESS ( status ) ) {
log_verbose ( " testing non ignorable \n " ) ;
ucol_setAttribute ( coll , UCOL_ALTERNATE_HANDLING , UCOL_NON_IGNORABLE , & status ) ;
doOverrunTest ( coll , uString , strLen ) ;
2003-05-15 18:28:41 +00:00
2006-09-28 08:41:37 +00:00
log_verbose ( " testing shifted \n " ) ;
ucol_setAttribute ( coll , UCOL_ALTERNATE_HANDLING , UCOL_SHIFTED , & status ) ;
doOverrunTest ( coll , uString , strLen ) ;
2003-05-15 18:28:41 +00:00
2006-09-28 08:41:37 +00:00
log_verbose ( " testing shifted quaternary \n " ) ;
ucol_setAttribute ( coll , UCOL_STRENGTH , UCOL_QUATERNARY , & status ) ;
doOverrunTest ( coll , uString , strLen ) ;
2003-05-15 18:28:41 +00:00
2006-09-28 08:41:37 +00:00
log_verbose ( " testing with french secondaries \n " ) ;
ucol_setAttribute ( coll , UCOL_FRENCH_COLLATION , UCOL_ON , & status ) ;
ucol_setAttribute ( coll , UCOL_STRENGTH , UCOL_TERTIARY , & status ) ;
ucol_setAttribute ( coll , UCOL_ALTERNATE_HANDLING , UCOL_NON_IGNORABLE , & status ) ;
doOverrunTest ( coll , uString , strLen ) ;
2003-05-15 18:28:41 +00:00
2006-09-28 08:41:37 +00:00
}
ucol_close ( coll ) ;
2003-05-15 18:28:41 +00:00
}
static void TestAttribute ( )
{
UErrorCode error = U_ZERO_ERROR ;
UCollator * coll = ucol_open ( NULL , & error ) ;
if ( U_FAILURE ( error ) ) {
log_err ( " Creation of default collator failed " ) ;
return ;
2003-05-09 20:10:44 +00:00
}
2003-05-15 18:28:41 +00:00
ucol_setAttribute ( coll , UCOL_FRENCH_COLLATION , UCOL_OFF , & error ) ;
if ( ucol_getAttribute ( coll , UCOL_FRENCH_COLLATION , & error ) ! = UCOL_OFF | |
U_FAILURE ( error ) ) {
log_err ( " Setting and retrieving of the french collation failed " ) ;
}
ucol_setAttribute ( coll , UCOL_FRENCH_COLLATION , UCOL_ON , & error ) ;
if ( ucol_getAttribute ( coll , UCOL_FRENCH_COLLATION , & error ) ! = UCOL_ON | |
U_FAILURE ( error ) ) {
log_err ( " Setting and retrieving of the french collation failed " ) ;
}
ucol_setAttribute ( coll , UCOL_ALTERNATE_HANDLING , UCOL_SHIFTED , & error ) ;
if ( ucol_getAttribute ( coll , UCOL_ALTERNATE_HANDLING , & error ) ! = UCOL_SHIFTED | |
U_FAILURE ( error ) ) {
log_err ( " Setting and retrieving of the alternate handling failed " ) ;
}
ucol_setAttribute ( coll , UCOL_ALTERNATE_HANDLING , UCOL_NON_IGNORABLE , & error ) ;
if ( ucol_getAttribute ( coll , UCOL_ALTERNATE_HANDLING , & error ) ! = UCOL_NON_IGNORABLE | |
U_FAILURE ( error ) ) {
log_err ( " Setting and retrieving of the alternate handling failed " ) ;
}
ucol_setAttribute ( coll , UCOL_CASE_FIRST , UCOL_LOWER_FIRST , & error ) ;
if ( ucol_getAttribute ( coll , UCOL_CASE_FIRST , & error ) ! = UCOL_LOWER_FIRST | |
U_FAILURE ( error ) ) {
log_err ( " Setting and retrieving of the case first attribute failed " ) ;
}
ucol_setAttribute ( coll , UCOL_CASE_FIRST , UCOL_UPPER_FIRST , & error ) ;
if ( ucol_getAttribute ( coll , UCOL_CASE_FIRST , & error ) ! = UCOL_UPPER_FIRST | |
U_FAILURE ( error ) ) {
log_err ( " Setting and retrieving of the case first attribute failed " ) ;
}
ucol_setAttribute ( coll , UCOL_CASE_LEVEL , UCOL_ON , & error ) ;
if ( ucol_getAttribute ( coll , UCOL_CASE_LEVEL , & error ) ! = UCOL_ON | |
U_FAILURE ( error ) ) {
log_err ( " Setting and retrieving of the case level attribute failed " ) ;
}
ucol_setAttribute ( coll , UCOL_CASE_LEVEL , UCOL_OFF , & error ) ;
if ( ucol_getAttribute ( coll , UCOL_CASE_LEVEL , & error ) ! = UCOL_OFF | |
U_FAILURE ( error ) ) {
log_err ( " Setting and retrieving of the case level attribute failed " ) ;
}
ucol_setAttribute ( coll , UCOL_NORMALIZATION_MODE , UCOL_ON , & error ) ;
if ( ucol_getAttribute ( coll , UCOL_NORMALIZATION_MODE , & error ) ! = UCOL_ON | |
U_FAILURE ( error ) ) {
log_err ( " Setting and retrieving of the normalization on/off attribute failed " ) ;
}
ucol_setAttribute ( coll , UCOL_NORMALIZATION_MODE , UCOL_OFF , & error ) ;
if ( ucol_getAttribute ( coll , UCOL_NORMALIZATION_MODE , & error ) ! = UCOL_OFF | |
U_FAILURE ( error ) ) {
log_err ( " Setting and retrieving of the normalization on/off attribute failed " ) ;
}
ucol_setAttribute ( coll , UCOL_STRENGTH , UCOL_PRIMARY , & error ) ;
if ( ucol_getAttribute ( coll , UCOL_STRENGTH , & error ) ! = UCOL_PRIMARY | |
U_FAILURE ( error ) ) {
log_err ( " Setting and retrieving of the collation strength failed " ) ;
}
ucol_setAttribute ( coll , UCOL_STRENGTH , UCOL_SECONDARY , & error ) ;
if ( ucol_getAttribute ( coll , UCOL_STRENGTH , & error ) ! = UCOL_SECONDARY | |
U_FAILURE ( error ) ) {
log_err ( " Setting and retrieving of the collation strength failed " ) ;
}
ucol_setAttribute ( coll , UCOL_STRENGTH , UCOL_TERTIARY , & error ) ;
if ( ucol_getAttribute ( coll , UCOL_STRENGTH , & error ) ! = UCOL_TERTIARY | |
U_FAILURE ( error ) ) {
log_err ( " Setting and retrieving of the collation strength failed " ) ;
}
ucol_setAttribute ( coll , UCOL_STRENGTH , UCOL_QUATERNARY , & error ) ;
if ( ucol_getAttribute ( coll , UCOL_STRENGTH , & error ) ! = UCOL_QUATERNARY | |
U_FAILURE ( error ) ) {
log_err ( " Setting and retrieving of the collation strength failed " ) ;
}
ucol_setAttribute ( coll , UCOL_STRENGTH , UCOL_IDENTICAL , & error ) ;
if ( ucol_getAttribute ( coll , UCOL_STRENGTH , & error ) ! = UCOL_IDENTICAL | |
U_FAILURE ( error ) ) {
log_err ( " Setting and retrieving of the collation strength failed " ) ;
}
ucol_close ( coll ) ;
}
void TestGetTailoredSet ( ) {
struct {
const char * rules ;
const char * tests [ 20 ] ;
int32_t testsize ;
} setTest [ ] = {
{ " &a < \\ u212b " , { " \\ u212b " , " A \\ u030a " , " \\ u00c5 " } , 3 } ,
{ " & S < \\ u0161 <<< \\ u0160 " , { " \\ u0161 " , " s \\ u030C " , " \\ u0160 " , " S \\ u030C " } , 4 }
} ;
int32_t i = 0 , j = 0 ;
UErrorCode status = U_ZERO_ERROR ;
UParseError pError ;
UCollator * coll = NULL ;
UChar buff [ 1024 ] ;
int32_t buffLen = 0 ;
USet * set = NULL ;
for ( i = 0 ; i < sizeof ( setTest ) / sizeof ( setTest [ 0 ] ) ; i + + ) {
buffLen = u_unescape ( setTest [ i ] . rules , buff , 1024 ) ;
coll = ucol_openRules ( buff , buffLen , UCOL_DEFAULT , UCOL_DEFAULT , & pError , & status ) ;
if ( U_SUCCESS ( status ) ) {
set = ucol_getTailoredSet ( coll , & status ) ;
if ( uset_size ( set ) ! = setTest [ i ] . testsize ) {
log_err ( " Tailored set size different (%d) than expected (%d) \n " , uset_size ( set ) , setTest [ i ] . testsize ) ;
}
for ( j = 0 ; j < setTest [ i ] . testsize ; j + + ) {
buffLen = u_unescape ( setTest [ i ] . tests [ j ] , buff , 1024 ) ;
if ( ! uset_containsString ( set , buff , buffLen ) ) {
log_err ( " Tailored set doesn't contain %s... It should \n " , setTest [ i ] . tests [ j ] ) ;
2003-05-15 16:28:58 +00:00
}
}
2003-05-15 18:28:41 +00:00
uset_close ( set ) ;
} else {
log_err ( " Couldn't open collator with rules %s \n " , setTest [ i ] . rules ) ;
2003-05-09 20:10:44 +00:00
}
2003-05-15 18:28:41 +00:00
ucol_close ( coll ) ;
}
}
static int tMemCmp ( const uint8_t * first , const uint8_t * second ) {
2004-11-05 17:21:42 +00:00
int32_t firstLen = ( int32_t ) strlen ( ( const char * ) first ) ;
int32_t secondLen = ( int32_t ) strlen ( ( const char * ) second ) ;
2003-05-15 16:28:58 +00:00
return memcmp ( first , second , uprv_min ( firstLen , secondLen ) ) ;
2003-05-15 18:28:41 +00:00
}
static const char * strengthsC [ ] = {
2003-05-15 16:28:58 +00:00
" UCOL_PRIMARY " ,
" UCOL_SECONDARY " ,
" UCOL_TERTIARY " ,
" UCOL_QUATERNARY " ,
" UCOL_IDENTICAL "
2003-05-15 18:28:41 +00:00
} ;
2003-05-15 16:28:58 +00:00
2003-05-15 18:28:41 +00:00
void TestMergeSortKeys ( void ) {
2003-05-15 16:28:58 +00:00
UErrorCode status = U_ZERO_ERROR ;
2003-06-04 06:53:23 +00:00
UCollator * coll = ucol_open ( " en " , & status ) ;
if ( U_SUCCESS ( status ) ) {
2003-05-15 16:28:58 +00:00
2003-06-04 06:53:23 +00:00
const char * cases [ ] = {
" abc " ,
" abcd " ,
" abcde "
} ;
uint32_t casesSize = sizeof ( cases ) / sizeof ( cases [ 0 ] ) ;
const char * prefix = " foo " ;
const char * suffix = " egg " ;
char outBuff1 [ 256 ] , outBuff2 [ 256 ] ;
2003-05-15 16:28:58 +00:00
2003-06-04 06:53:23 +00:00
uint8_t * * sortkeys = ( uint8_t * * ) malloc ( casesSize * sizeof ( uint8_t * ) ) ;
uint8_t * * mergedPrefixkeys = ( uint8_t * * ) malloc ( casesSize * sizeof ( uint8_t * ) ) ;
uint8_t * * mergedSuffixkeys = ( uint8_t * * ) malloc ( casesSize * sizeof ( uint8_t * ) ) ;
uint32_t * sortKeysLen = ( uint32_t * ) malloc ( casesSize * sizeof ( uint32_t ) ) ;
uint8_t prefixKey [ 256 ] , suffixKey [ 256 ] ;
uint32_t prefixKeyLen = 0 , suffixKeyLen = 0 , i = 0 ;
UChar buffer [ 256 ] ;
uint32_t unescapedLen = 0 , l1 = 0 , l2 = 0 ;
UColAttributeValue strength ;
2003-05-15 16:28:58 +00:00
2003-06-04 06:53:23 +00:00
log_verbose ( " ucol_mergeSortkeys test \n " ) ;
log_verbose ( " Testing order of the test cases \n " ) ;
genericLocaleStarter ( " en " , cases , casesSize ) ;
2003-05-15 16:28:58 +00:00
2003-06-04 06:53:23 +00:00
for ( i = 0 ; i < casesSize ; i + + ) {
sortkeys [ i ] = ( uint8_t * ) malloc ( 256 * sizeof ( uint8_t ) ) ;
mergedPrefixkeys [ i ] = ( uint8_t * ) malloc ( 256 * sizeof ( uint8_t ) ) ;
mergedSuffixkeys [ i ] = ( uint8_t * ) malloc ( 256 * sizeof ( uint8_t ) ) ;
}
2003-05-15 16:28:58 +00:00
2003-06-04 06:53:23 +00:00
unescapedLen = u_unescape ( prefix , buffer , 256 ) ;
prefixKeyLen = ucol_getSortKey ( coll , buffer , unescapedLen , prefixKey , 256 ) ;
2003-05-15 16:28:58 +00:00
2003-06-04 06:53:23 +00:00
unescapedLen = u_unescape ( suffix , buffer , 256 ) ;
suffixKeyLen = ucol_getSortKey ( coll , buffer , unescapedLen , suffixKey , 256 ) ;
2003-05-15 16:28:58 +00:00
2003-06-04 06:53:23 +00:00
log_verbose ( " Massaging data with prefixes and different strengths \n " ) ;
strength = UCOL_PRIMARY ;
while ( strength < = UCOL_IDENTICAL ) {
log_verbose ( " Strength %s \n " , strengthsC [ strength < = UCOL_QUATERNARY ? strength : 4 ] ) ;
ucol_setAttribute ( coll , UCOL_STRENGTH , strength , & status ) ;
for ( i = 0 ; i < casesSize ; i + + ) {
unescapedLen = u_unescape ( cases [ i ] , buffer , 256 ) ;
sortKeysLen [ i ] = ucol_getSortKey ( coll , buffer , unescapedLen , sortkeys [ i ] , 256 ) ;
ucol_mergeSortkeys ( prefixKey , prefixKeyLen , sortkeys [ i ] , sortKeysLen [ i ] , mergedPrefixkeys [ i ] , 256 ) ;
ucol_mergeSortkeys ( sortkeys [ i ] , sortKeysLen [ i ] , suffixKey , suffixKeyLen , mergedSuffixkeys [ i ] , 256 ) ;
if ( i > 0 ) {
if ( tMemCmp ( mergedPrefixkeys [ i - 1 ] , mergedPrefixkeys [ i ] ) > = 0 ) {
log_err ( " Error while comparing prefixed keys @ strength %s: \n " , strengthsC [ strength < = UCOL_QUATERNARY ? strength : 4 ] ) ;
log_err ( " %s \n %s \n " ,
ucol_sortKeyToString ( coll , mergedPrefixkeys [ i - 1 ] , outBuff1 , & l1 ) ,
ucol_sortKeyToString ( coll , mergedPrefixkeys [ i ] , outBuff2 , & l2 ) ) ;
}
if ( tMemCmp ( mergedSuffixkeys [ i - 1 ] , mergedSuffixkeys [ i ] ) > = 0 ) {
log_err ( " Error while comparing suffixed keys @ strength %s: \n " , strengthsC [ strength < = UCOL_QUATERNARY ? strength : 4 ] ) ;
log_err ( " %s \n %s \n " ,
ucol_sortKeyToString ( coll , mergedSuffixkeys [ i - 1 ] , outBuff1 , & l1 ) ,
ucol_sortKeyToString ( coll , mergedSuffixkeys [ i ] , outBuff2 , & l2 ) ) ;
}
2003-05-15 16:28:58 +00:00
}
}
2003-06-04 06:53:23 +00:00
if ( strength = = UCOL_QUATERNARY ) {
strength = UCOL_IDENTICAL ;
} else {
strength + + ;
}
2003-05-15 16:28:58 +00:00
}
2003-06-04 06:53:23 +00:00
{
uint8_t smallBuf [ 3 ] ;
uint32_t reqLen = 0 ;
log_verbose ( " testing buffer overflow \n " ) ;
reqLen = ucol_mergeSortkeys ( prefixKey , prefixKeyLen , suffixKey , suffixKeyLen , smallBuf , 3 ) ;
if ( reqLen ! = ( prefixKeyLen + suffixKeyLen - 1 ) ) {
log_err ( " Wrong preflight size for merged sortkey \n " ) ;
}
2003-05-15 16:28:58 +00:00
}
2003-06-04 06:53:23 +00:00
{
UChar empty = 0 ;
uint8_t emptyKey [ 20 ] , abcKey [ 50 ] , mergedKey [ 100 ] ;
int32_t emptyKeyLen = 0 , abcKeyLen = 0 , mergedKeyLen = 0 ;
2003-05-15 16:28:58 +00:00
2003-06-04 06:53:23 +00:00
log_verbose ( " testing merging with sortkeys generated for empty strings \n " ) ;
emptyKeyLen = ucol_getSortKey ( coll , & empty , 0 , emptyKey , 20 ) ;
unescapedLen = u_unescape ( cases [ 0 ] , buffer , 256 ) ;
abcKeyLen = ucol_getSortKey ( coll , buffer , unescapedLen , abcKey , 50 ) ;
mergedKeyLen = ucol_mergeSortkeys ( emptyKey , emptyKeyLen , abcKey , abcKeyLen , mergedKey , 100 ) ;
if ( mergedKey [ 0 ] ! = 2 ) {
log_err ( " Empty sortkey didn't produce a level separator \n " ) ;
}
/* try with zeros */
mergedKeyLen = ucol_mergeSortkeys ( emptyKey , 0 , abcKey , abcKeyLen , mergedKey , 100 ) ;
if ( mergedKeyLen ! = 0 | | mergedKey [ 0 ] ! = 0 ) {
log_err ( " Empty key didn't produce null mergedKey \n " ) ;
}
mergedKeyLen = ucol_mergeSortkeys ( abcKey , abcKeyLen , emptyKey , 0 , mergedKey , 100 ) ;
if ( mergedKeyLen ! = 0 | | mergedKey [ 0 ] ! = 0 ) {
log_err ( " Empty key didn't produce null mergedKey \n " ) ;
}
2003-05-15 16:28:58 +00:00
2003-06-04 06:53:23 +00:00
}
2003-05-15 16:28:58 +00:00
2003-06-04 06:53:23 +00:00
for ( i = 0 ; i < casesSize ; i + + ) {
free ( sortkeys [ i ] ) ;
free ( mergedPrefixkeys [ i ] ) ;
free ( mergedSuffixkeys [ i ] ) ;
}
free ( sortkeys ) ;
free ( mergedPrefixkeys ) ;
free ( mergedSuffixkeys ) ;
free ( sortKeysLen ) ;
ucol_close ( coll ) ;
/* need to finish this up */
} else {
log_data_err ( " Couldn't open collator " ) ;
2003-05-15 16:28:58 +00:00
}
2003-05-15 18:28:41 +00:00
}
2004-05-24 22:08:38 +00:00
static void TestShortString ( void )
{
struct {
const char * input ;
const char * expectedOutput ;
const char * locale ;
UErrorCode expectedStatus ;
int32_t expectedOffset ;
uint32_t expectedIdentifier ;
} testCases [ ] = {
2008-04-04 22:47:43 +00:00
{ " LDE_RDE_KPHONEBOOK_T0041_ZLATN " , " B2C00_KPHONEBOOK_LDE " , " de@collation=phonebook " , U_USING_FALLBACK_WARNING , 0 , 0 } ,
2004-05-24 22:08:38 +00:00
{ " LEN_RUS_NO_AS_S4 " , " AS_LEN_NO_S4 " , NULL , U_USING_FALLBACK_WARNING , 0 , 0 } ,
{ " LDE_VPHONEBOOK_EO_SI " , " EO_KPHONEBOOK_LDE_SI " , " de@collation=phonebook " , U_ZERO_ERROR , 0 , 0 } ,
{ " LDE_Kphonebook " , " KPHONEBOOK_LDE " , " de@collation=phonebook " , U_ZERO_ERROR , 0 , 0 } ,
{ " Xqde_DE@collation=phonebookq_S3_EX " , " KPHONEBOOK_LDE " , " de@collation=phonebook " , U_USING_FALLBACK_WARNING , 0 , 0 } ,
{ " LFR_FO " , " LFR " , NULL , U_ZERO_ERROR , 0 , 0 } ,
2004-05-25 23:00:52 +00:00
{ " SO_LX_AS " , " " , NULL , U_ILLEGAL_ARGUMENT_ERROR , 8 , 0 } ,
2004-05-24 22:08:38 +00:00
{ " S3_ASS_MMM " , " " , NULL , U_ILLEGAL_ARGUMENT_ERROR , 5 , 0 }
} ;
2008-02-08 09:50:36 +00:00
int32_t i = 0 ;
2008-01-05 01:27:56 +00:00
UCollator * coll = NULL , * fromNormalized = NULL ;
2004-05-24 22:08:38 +00:00
UParseError parseError ;
UErrorCode status = U_ZERO_ERROR ;
2008-01-05 01:27:56 +00:00
char fromShortBuffer [ 256 ] , normalizedBuffer [ 256 ] , fromNormalizedBuffer [ 256 ] ;
2004-05-24 22:08:38 +00:00
const char * locale = NULL ;
for ( i = 0 ; i < sizeof ( testCases ) / sizeof ( testCases [ 0 ] ) ; i + + ) {
status = U_ZERO_ERROR ;
if ( testCases [ i ] . locale ) {
locale = testCases [ i ] . locale ;
} else {
locale = NULL ;
}
coll = ucol_openFromShortString ( testCases [ i ] . input , FALSE , & parseError , & status ) ;
if ( status ! = testCases [ i ] . expectedStatus ) {
log_err ( " Got status '%s' that is different from expected '%s' for '%s' \n " ,
u_errorName ( status ) , u_errorName ( testCases [ i ] . expectedStatus ) , testCases [ i ] . input ) ;
}
if ( U_SUCCESS ( status ) ) {
ucol_getShortDefinitionString ( coll , locale , fromShortBuffer , 256 , & status ) ;
if ( strcmp ( fromShortBuffer , testCases [ i ] . expectedOutput ) ) {
log_err ( " Got short string '%s' from the collator. Expected '%s' for input '%s' \n " ,
fromShortBuffer , testCases [ i ] . expectedOutput , testCases [ i ] . input ) ;
}
ucol_normalizeShortDefinitionString ( testCases [ i ] . input , normalizedBuffer , 256 , & parseError , & status ) ;
fromNormalized = ucol_openFromShortString ( normalizedBuffer , FALSE , & parseError , & status ) ;
ucol_getShortDefinitionString ( fromNormalized , locale , fromNormalizedBuffer , 256 , & status ) ;
if ( strcmp ( fromShortBuffer , fromNormalizedBuffer ) ) {
log_err ( " Strings obtained from collators instantiated by short string ('%s') and from normalized string ('%s') differ \n " ,
fromShortBuffer , fromNormalizedBuffer ) ;
}
if ( ! ucol_equals ( coll , fromNormalized ) ) {
log_err ( " Collator from short string ('%s') differs from one obtained through a normalized version ('%s') \n " ,
testCases [ i ] . input , normalizedBuffer ) ;
}
ucol_close ( fromNormalized ) ;
ucol_close ( coll ) ;
} else {
if ( parseError . offset ! = testCases [ i ] . expectedOffset ) {
log_err ( " Got parse error offset %i, but expected %i instead for '%s' \n " ,
parseError . offset , testCases [ i ] . expectedOffset , testCases [ i ] . input ) ;
}
}
}
}
2004-06-03 20:13:58 +00:00
static void
2007-07-25 18:46:17 +00:00
doSetsTest ( const char * locale , const USet * ref , USet * set , const char * inSet , const char * outSet , UErrorCode * status ) {
2004-06-03 20:13:58 +00:00
UChar buffer [ 512 ] ;
int32_t bufLen ;
uset_clear ( set ) ;
bufLen = u_unescape ( inSet , buffer , 512 ) ;
uset_applyPattern ( set , buffer , bufLen , 0 , status ) ;
if ( U_FAILURE ( * status ) ) {
2007-07-25 18:46:17 +00:00
log_err ( " %s: Failure setting pattern %s \n " , locale , u_errorName ( * status ) ) ;
2004-06-03 20:13:58 +00:00
}
if ( ! uset_containsAll ( ref , set ) ) {
2007-07-25 18:46:17 +00:00
log_err ( " %s: Some stuff from %s is not present in the set \n " , locale , inSet ) ;
2004-06-03 20:13:58 +00:00
}
uset_clear ( set ) ;
bufLen = u_unescape ( outSet , buffer , 512 ) ;
uset_applyPattern ( set , buffer , bufLen , 0 , status ) ;
if ( U_FAILURE ( * status ) ) {
2007-07-25 18:46:17 +00:00
log_err ( " %s: Failure setting pattern %s \n " , locale , u_errorName ( * status ) ) ;
2004-06-03 20:13:58 +00:00
}
if ( ! uset_containsNone ( ref , set ) ) {
2007-07-25 18:46:17 +00:00
log_err ( " %s: Some stuff from %s is present in the set \n " , locale , outSet ) ;
2004-06-03 20:13:58 +00:00
}
}
static void
TestGetContractionsAndUnsafes ( void )
{
static struct {
const char * locale ;
const char * inConts ;
const char * outConts ;
2005-06-21 20:43:04 +00:00
const char * inExp ;
const char * outExp ;
2004-06-03 20:13:58 +00:00
const char * unsafeCodeUnits ;
const char * safeCodeUnits ;
} tests [ ] = {
{ " ru " ,
" [{ \\ u0474 \\ u030F}{ \\ u0475 \\ u030F}{ \\ u04D8 \\ u0308}{ \\ u04D9 \\ u0308}{ \\ u04E8 \\ u0308}{ \\ u04E9 \\ u0308}] " ,
" [{ \\ u0430 \\ u0306}{ \\ u0410 \\ u0306}{ \\ u0430 \\ u0308}{ \\ u0410 \\ u0306}{ \\ u0433 \\ u0301}{ \\ u0413 \\ u0301}] " ,
2005-06-21 20:43:04 +00:00
" [ \\ u00e6] " ,
" [a] " ,
2004-06-14 21:00:06 +00:00
" [ \\ u0474 \\ u0475 \\ u04d8 \\ u04d9 \\ u04e8 \\ u04e9] " ,
" [aAbB \\ u0430 \\ u0410 \\ u0433 \\ u0413] "
2004-06-03 20:13:58 +00:00
} ,
{ " uk " ,
" [{ \\ u0474 \\ u030F}{ \\ u0475 \\ u030F}{ \\ u04D8 \\ u0308}{ \\ u04D9 \\ u0308}{ \\ u04E8 \\ u0308}{ \\ u04E9 \\ u0308} "
" { \\ u0430 \\ u0306}{ \\ u0410 \\ u0306}{ \\ u0430 \\ u0308}{ \\ u0410 \\ u0306}{ \\ u0433 \\ u0301}{ \\ u0413 \\ u0301}] " ,
" [] " ,
2005-06-21 20:43:04 +00:00
" [ \\ u00e6] " ,
" [a] " ,
2004-06-14 21:00:06 +00:00
" [ \\ u0474 \\ u0475 \\ u04D8 \\ u04D9 \\ u04E8 \\ u04E9 \\ u0430 \\ u0410 \\ u0433 \\ u0413] " ,
" [aAbBxv] " ,
2004-06-03 20:13:58 +00:00
} ,
{ " sh " ,
" [{C \\ u0301}{C \\ u030C}{C \\ u0341}{DZ \\ u030C}{Dz \\ u030C}{D \\ u017D}{D \\ u017E}{lj}{nj}] " ,
" [{ \\ u309d \\ u3099}{ \\ u30fd \\ u3099}] " ,
2005-06-21 20:43:04 +00:00
" [ \\ u00e6] " ,
" [a] " ,
2004-06-14 21:00:06 +00:00
" [nlcdzNLCDZ] " ,
" [jabv] "
2005-06-21 20:43:04 +00:00
} ,
{ " ja " ,
" [{ \\ u3053 \\ u3099 \\ u309D}{ \\ u3053 \\ u3099 \\ u309D \\ u3099}{ \\ u3053 \\ u3099 \\ u309E}{ \\ u3053 \\ u3099 \\ u30FC}{ \\ u3053 \\ u309D}{ \\ u3053 \\ u309D \\ u3099}{ \\ u3053 \\ u309E}{ \\ u3053 \\ u30FC}{ \\ u30B3 \\ u3099 \\ u30FC}{ \\ u30B3 \\ u3099 \\ u30FD}{ \\ u30B3 \\ u3099 \\ u30FD \\ u3099}{ \\ u30B3 \\ u3099 \\ u30FE}{ \\ u30B3 \\ u30FC}{ \\ u30B3 \\ u30FD}{ \\ u30B3 \\ u30FD \\ u3099}{ \\ u30B3 \\ u30FE}] " ,
" [{ \\ u30FD \\ u3099}{ \\ u309D \\ u3099}{ \\ u3053 \\ u3099}{ \\ u30B3 \\ u3099}{lj}{nj}] " ,
" [ \\ u30FE \\ u00e6] " ,
" [a] " ,
" [ \\ u3099] " ,
" [] "
2004-06-03 20:13:58 +00:00
}
} ;
UErrorCode status = U_ZERO_ERROR ;
UCollator * coll = NULL ;
int32_t i = 0 ;
int32_t noConts = 0 ;
USet * conts = uset_open ( 0 , 0 ) ;
2005-06-21 20:43:04 +00:00
USet * exp = uset_open ( 0 , 0 ) ;
2004-06-03 20:13:58 +00:00
USet * set = uset_open ( 0 , 0 ) ;
2005-06-21 20:43:04 +00:00
int32_t setBufferLen = 65536 ;
UChar buffer [ 65536 ] ;
2004-06-03 20:13:58 +00:00
int32_t setLen = 0 ;
for ( i = 0 ; i < sizeof ( tests ) / sizeof ( tests [ 0 ] ) ; i + + ) {
log_verbose ( " Testing locale: %s \n " , tests [ i ] . locale ) ;
coll = ucol_open ( tests [ i ] . locale , & status ) ;
2005-06-21 20:43:04 +00:00
ucol_getContractionsAndExpansions ( coll , conts , exp , TRUE , & status ) ;
2007-07-25 18:46:17 +00:00
doSetsTest ( tests [ i ] . locale , conts , set , tests [ i ] . inConts , tests [ i ] . outConts , & status ) ;
2005-06-21 20:43:04 +00:00
setLen = uset_toPattern ( conts , buffer , setBufferLen , TRUE , & status ) ;
2004-06-03 20:13:58 +00:00
if ( U_SUCCESS ( status ) ) {
2005-06-21 20:43:04 +00:00
/*log_verbose("Contractions %i: %s\n", uset_getItemCount(conts), aescstrdup(buffer, setLen));*/
2004-06-03 20:13:58 +00:00
} else {
log_err ( " error %s. %i \n " , u_errorName ( status ) , setLen ) ;
2005-06-21 20:43:04 +00:00
status = U_ZERO_ERROR ;
}
2007-07-25 18:46:17 +00:00
doSetsTest ( tests [ i ] . locale , exp , set , tests [ i ] . inExp , tests [ i ] . outExp , & status ) ;
2005-06-21 20:43:04 +00:00
setLen = uset_toPattern ( exp , buffer , setBufferLen , TRUE , & status ) ;
if ( U_SUCCESS ( status ) ) {
/*log_verbose("Expansions %i: %s\n", uset_getItemCount(exp), aescstrdup(buffer, setLen));*/
} else {
log_err ( " error %s. %i \n " , u_errorName ( status ) , setLen ) ;
status = U_ZERO_ERROR ;
2004-06-03 20:13:58 +00:00
}
noConts = ucol_getUnsafeSet ( coll , conts , & status ) ;
2007-07-25 18:46:17 +00:00
doSetsTest ( tests [ i ] . locale , conts , set , tests [ i ] . unsafeCodeUnits , tests [ i ] . safeCodeUnits , & status ) ;
2005-06-21 20:43:04 +00:00
setLen = uset_toPattern ( conts , buffer , setBufferLen , TRUE , & status ) ;
if ( U_SUCCESS ( status ) ) {
log_verbose ( " Unsafe %i: %s \n " , uset_getItemCount ( exp ) , aescstrdup ( buffer , setLen ) ) ;
} else {
log_err ( " error %s. %i \n " , u_errorName ( status ) , setLen ) ;
status = U_ZERO_ERROR ;
}
2004-06-03 20:13:58 +00:00
ucol_close ( coll ) ;
}
uset_close ( conts ) ;
2005-06-27 16:21:32 +00:00
uset_close ( exp ) ;
2004-06-03 20:13:58 +00:00
uset_close ( set ) ;
}
2005-07-06 21:27:21 +00:00
static void
TestOpenBinary ( void )
{
2007-06-13 22:53:28 +00:00
UErrorCode status = U_ZERO_ERROR ;
/*
char rule [ ] = " &h < d < c < b " ;
char * wUCA [ ] = { " a " , " h " , " d " , " c " , " b " , " i " } ;
char * noUCA [ ] = { " d " , " c " , " b " , " a " , " h " , " i " } ;
*/
/* we have to use Cyrillic letters because latin-1 always gets copied */
const char rule [ ] = " & \\ u0452 < \\ u0434 < \\ u0433 < \\ u0432 " ; /* &dje < d < g < v */
const char * wUCA [ ] = { " \\ u0430 " , " \\ u0452 " , " \\ u0434 " , " \\ u0433 " , " \\ u0432 " , " \\ u0435 " } ; /* a, dje, d, g, v, e */
const char * noUCA [ ] = { " \\ u0434 " , " \\ u0433 " , " \\ u0432 " , " \\ u0430 " , " \\ u0435 " , " \\ u0452 " } ; /* d, g, v, a, e, dje */
2005-07-06 21:27:21 +00:00
2007-06-13 22:53:28 +00:00
UChar uRules [ 256 ] ;
int32_t uRulesLen = u_unescape ( rule , uRules , 256 ) ;
2005-07-06 21:27:21 +00:00
2007-06-13 22:53:28 +00:00
UCollator * coll = ucol_openRules ( uRules , uRulesLen , UCOL_DEFAULT , UCOL_DEFAULT , NULL , & status ) ;
2007-12-07 10:49:34 +00:00
UCollator * UCA = NULL ;
2007-06-13 22:53:28 +00:00
UCollator * cloneNOUCA = NULL , * cloneWUCA = NULL ;
2005-07-06 21:27:21 +00:00
2007-06-13 22:53:28 +00:00
uint8_t imageBuffer [ 32768 ] ;
uint8_t * image = imageBuffer ;
int32_t imageBufferCapacity = 32768 ;
2005-07-06 21:27:21 +00:00
2007-06-13 22:53:28 +00:00
int32_t imageSize ;
2005-07-06 21:27:21 +00:00
2007-12-07 10:49:34 +00:00
if ( ( coll = = NULL ) | | ( U_FAILURE ( status ) ) ) {
2007-06-13 22:53:28 +00:00
log_data_err ( " could not load collators or error occured: %s \n " ,
u_errorName ( status ) ) ;
return ;
}
2007-12-07 10:49:34 +00:00
UCA = ucol_open ( " root " , & status ) ;
if ( ( UCA = = NULL ) | | ( U_FAILURE ( status ) ) ) {
log_data_err ( " could not load UCA collator or error occured: %s \n " ,
u_errorName ( status ) ) ;
return ;
}
2007-06-13 22:53:28 +00:00
imageSize = ucol_cloneBinary ( coll , image , imageBufferCapacity , & status ) ;
if ( U_FAILURE ( status ) ) {
image = ( uint8_t * ) malloc ( imageSize * sizeof ( uint8_t ) ) ;
status = U_ZERO_ERROR ;
imageSize = ucol_cloneBinary ( coll , imageBuffer , imageSize , & status ) ;
}
2005-07-06 21:27:21 +00:00
2007-06-13 22:53:28 +00:00
cloneWUCA = ucol_openBinary ( image , imageSize , UCA , & status ) ;
cloneNOUCA = ucol_openBinary ( image , imageSize , NULL , & status ) ;
2005-07-06 21:27:21 +00:00
2007-06-13 22:53:28 +00:00
genericOrderingTest ( coll , wUCA , sizeof ( wUCA ) / sizeof ( wUCA [ 0 ] ) ) ;
genericOrderingTest ( cloneWUCA , wUCA , sizeof ( wUCA ) / sizeof ( wUCA [ 0 ] ) ) ;
genericOrderingTest ( cloneNOUCA , noUCA , sizeof ( noUCA ) / sizeof ( noUCA [ 0 ] ) ) ;
if ( image ! = imageBuffer ) {
free ( image ) ;
}
ucol_close ( coll ) ;
ucol_close ( cloneNOUCA ) ;
ucol_close ( cloneWUCA ) ;
ucol_close ( UCA ) ;
}
static void TestDefault ( void ) {
/* Tests for code coverage. */
UErrorCode status = U_ZERO_ERROR ;
UCollator * coll = ucol_open ( " es@collation=pinyin " , & status ) ;
if ( status ! = U_USING_DEFAULT_WARNING ) {
/* What do you mean that you know about using pinyin collation in Spanish!? This should be in the zh locale. */
log_err ( " es@collation=pinyin should return U_USING_DEFAULT_WARNING, but returned %s \n " , u_errorName ( status ) ) ;
}
ucol_close ( coll ) ;
if ( ucol_getKeywordValues ( " funky " , & status ) ! = NULL ) {
log_err ( " Collators should not know about the funky keyword. \n " ) ;
}
if ( status ! = U_ILLEGAL_ARGUMENT_ERROR ) {
log_err ( " funky keyword didn't fail as expected %s \n " , u_errorName ( status ) ) ;
}
if ( ucol_getKeywordValues ( " collation " , & status ) ! = NULL ) {
log_err ( " ucol_getKeywordValues should not work when given a bad status. \n " ) ;
}
2005-07-06 21:27:21 +00:00
}
2008-11-17 20:27:25 +00:00
static void TestDefaultKeyword ( void ) {
/* Tests for code coverage. */
UErrorCode status = U_ZERO_ERROR ;
const char * loc = " zh_TW@collation=default " ;
UCollator * coll = ucol_open ( loc , & status ) ;
if ( U_FAILURE ( status ) ) {
log_info ( " Warning: ucol_open(%s, ...) returned %s, at least it didn't crash. \n " , loc , u_errorName ( status ) ) ;
2008-11-17 21:46:15 +00:00
} else if ( status ! = U_USING_FALLBACK_WARNING ) {
log_err ( " ucol_open(%s, ...) should return an error or some sort of U_USING_FALLBACK_WARNING, but returned %s \n " , loc , u_errorName ( status ) ) ;
2008-11-17 20:27:25 +00:00
}
ucol_close ( coll ) ;
}
2009-03-09 20:39:13 +00:00
static void TestGetKeywordValuesForLocale ( void ) {
# define PREFERRED_SIZE 16
# define MAX_NUMBER_OF_KEYWORDS 6
const char * PREFERRED [ PREFERRED_SIZE ] [ MAX_NUMBER_OF_KEYWORDS + 1 ] = {
{ " und " , " standard " , NULL , NULL , NULL , NULL , NULL } ,
{ " en_US " , " standard " , NULL , NULL , NULL , NULL , NULL } ,
{ " en_029 " , " standard " , NULL , NULL , NULL , NULL , NULL } ,
{ " de_DE " , " standard " , " phonebook " , NULL , NULL , NULL , NULL } ,
{ " de_Latn_DE " , " standard " , " phonebook " , NULL , NULL , NULL , NULL } ,
{ " zh " , " pinyin " , " big5han " , " gb2312han " , " standard " , " stroke " , " unihan " } ,
{ " zh_Hans " , " pinyin " , " big5han " , " gb2312han " , " standard " , " stroke " , " unihan " } ,
{ " zh_CN " , " pinyin " , " big5han " , " gb2312han " , " standard " , " stroke " , " unihan " } ,
{ " zh_Hant " , " stroke " , " big5han " , " gb2312han " , " pinyin " , " standard " , " unihan " } ,
{ " zh_TW " , " stroke " , " big5han " , " gb2312han " , " pinyin " , " standard " , " unihan " } ,
{ " zh__PINYIN " , " pinyin " , " big5han " , " gb2312han " , " standard " , " stroke " , " unihan " } ,
{ " es_ES " , " standard " , " traditional " , NULL , NULL , NULL , NULL } ,
{ " es__TRADITIONAL " , " traditional " , " standard " , NULL , NULL , NULL , NULL } ,
{ " und@collation=phonebook " , " standard " , NULL , NULL , NULL , NULL , NULL } ,
{ " de_DE@collation=big5han " , " standard " , " phonebook " , NULL , NULL , NULL , NULL } ,
{ " zzz@collation=xxx " , " standard " , NULL , NULL , NULL , NULL , NULL }
} ;
const int32_t expectedLength [ PREFERRED_SIZE ] = { 1 , 1 , 1 , 2 , 2 , 6 , 6 , 6 , 6 , 6 , 6 , 2 , 2 , 1 , 2 , 1 } ;
UErrorCode status = U_ZERO_ERROR ;
UEnumeration * keywordValues = NULL ;
int32_t i , n ;
UBool errorOccurred = FALSE ;
for ( i = 0 ; i < PREFERRED_SIZE ; i + + ) {
const char * locale = PREFERRED [ i ] [ 0 ] ;
const char * value = NULL ;
int32_t valueLength = 0 ;
int32_t size = 0 ;
keywordValues = ucol_getKeywordValuesForLocale ( " collation " , locale , TRUE , & status ) ;
if ( keywordValues = = NULL | | U_FAILURE ( status ) ) {
log_err ( " Error getting keyword values: %s \n " , u_errorName ( status ) ) ;
break ;
}
size = uenum_count ( keywordValues , & status ) ;
if ( size = = expectedLength [ i ] ) {
for ( n = 0 ; n < expectedLength [ i ] ; n + + ) {
if ( ( value = uenum_next ( keywordValues , valueLength , & status ) ) ! = NULL & & U_SUCCESS ( status ) ) {
if ( uprv_strcmp ( value , PREFERRED [ i ] [ n + 1 ] ) ! = 0 ) {
log_err ( " Keyword values differ: Got [%s] Expected [%s] for locale: %s \n " , value , PREFERRED [ i ] [ n + 1 ] , locale ) ;
errorOccurred = TRUE ;
break ;
}
} else {
log_err ( " While getting keyword value from locale: %s got this error: %s \n " , locale , u_errorName ( status ) ) ;
errorOccurred = TRUE ;
break ;
}
}
if ( errorOccurred ) {
break ;
}
} else {
log_err ( " Number of keywords (%d) does not match expected size (%d) for locale: %s \n " , size , expectedLength [ i ] , locale ) ;
break ;
}
uenum_close ( keywordValues ) ;
keywordValues = NULL ;
}
if ( keywordValues ! = NULL ) {
uenum_close ( keywordValues ) ;
}
}
2008-11-17 20:27:25 +00:00
2005-07-14 20:55:39 +00:00
# endif /* #if !UCONFIG_NO_COLLATION */