2000-01-15 02:00:06 +00:00
|
|
|
/********************************************************************
|
|
|
|
* COPYRIGHT:
|
|
|
|
* Copyright (c) 1997-1999, International Business Machines Corporation and
|
2000-12-12 20:33:54 +00:00
|
|
|
* others. All Rights Reserved.
|
2000-01-15 02:00:06 +00:00
|
|
|
********************************************************************/
|
1999-08-16 21:50:52 +00:00
|
|
|
#ifndef _COLL
|
1999-12-28 23:57:50 +00:00
|
|
|
#include "unicode/coll.h"
|
1999-08-16 21:50:52 +00:00
|
|
|
#endif
|
|
|
|
|
|
|
|
#ifndef _TBLCOLL
|
1999-12-28 23:57:50 +00:00
|
|
|
#include "unicode/tblcoll.h"
|
1999-08-16 21:50:52 +00:00
|
|
|
#endif
|
|
|
|
|
|
|
|
#ifndef _UNISTR
|
1999-12-28 23:57:50 +00:00
|
|
|
#include "unicode/unistr.h"
|
1999-08-16 21:50:52 +00:00
|
|
|
#endif
|
|
|
|
|
|
|
|
#ifndef _SORTKEY
|
1999-12-28 23:57:50 +00:00
|
|
|
#include "unicode/sortkey.h"
|
1999-08-16 21:50:52 +00:00
|
|
|
#endif
|
|
|
|
|
|
|
|
#ifndef _JACOLL
|
|
|
|
#include "jacoll.h"
|
|
|
|
#endif
|
|
|
|
|
2000-12-12 19:40:58 +00:00
|
|
|
#include "sfwdchit.h"
|
|
|
|
|
1999-08-16 21:50:52 +00:00
|
|
|
/**
 * Builds the test fixture: creates a collator for Locale::JAPAN and switches
 * decomposition on for it.
 *
 * If the collator cannot be created, an error is logged and myCollation is
 * left NULL.
 */
CollationKanaTest::CollationKanaTest()
: myCollation(0)
{
    UErrorCode status = U_ZERO_ERROR;
    myCollation = Collator::createInstance(Locale::JAPAN, status);
    if(!myCollation || U_FAILURE(status)) {
        /* ": " keeps the file name and the message text from running together */
        errln(__FILE__ ": failed to create! err " + UnicodeString(u_errorName(status)));
        /* Release the object in case one was returned together with a
         * failure status; deleting a null pointer is a no-op. */
        delete myCollation;
        myCollation = NULL;
        return;
    }

    myCollation->setDecomposition(Normalizer::DECOMP);
}
|
|
|
|
|
|
|
|
/**
 * Releases the collator created by the constructor.
 * myCollation may be NULL if creation failed; deleting NULL is harmless.
 */
CollationKanaTest::~CollationKanaTest() {
    delete myCollation;
}
|
|
|
|
|
|
|
|
/*
 * Left-hand strings for TestTertiary. Entry i is compared against
 * testTargetCases[i] and the outcome is checked against results[i].
 * Every string is terminated by 0x0000.
 */
const UChar CollationKanaTest::testSourceCases[][CollationKanaTest::MAX_TOKEN_LEN] = {
    /* 0 */ { 0xFF9E, 0x0000 },                  /* halfwidth voiced sound mark */
    /* 1 */ { 0x3042, 0x0000 },                  /* hiragana A */
    /* 2 */ { 0x30A2, 0x0000 },                  /* katakana A */
    /* 3 */ { 0x3042, 0x3042, 0x0000 },          /* hiragana A, hiragana A */
    /* 4 */ { 0x30A2, 0x30FC, 0x0000 },          /* katakana A, prolonged sound mark */
    /* 5 */ { 0x30A2, 0x30FC, 0x30C8, 0x0000 }   /* katakana A, prolonged sound mark, katakana TO */
};
|
|
|
|
|
|
|
|
/*
 * Right-hand strings for TestTertiary. Entry i is the comparison partner of
 * testSourceCases[i]. Every string is terminated by 0x0000.
 */
const UChar CollationKanaTest::testTargetCases[][CollationKanaTest::MAX_TOKEN_LEN] = {
    /* 0 */ { 0xFF9F, 0x0000 },                  /* halfwidth semi-voiced sound mark */
    /* 1 */ { 0x30A2, 0x0000 },                  /* katakana A */
    /* 2 */ { 0x3042, 0x3042, 0x0000 },          /* hiragana A, hiragana A */
    /* 3 */ { 0x30A2, 0x30FC, 0x0000 },          /* katakana A, prolonged sound mark */
    /* 4 */ { 0x30A2, 0x30FC, 0x30C8, 0x0000 },  /* katakana A, prolonged sound mark, katakana TO */
    /* 5 */ { 0x3042, 0x3042, 0x3068, 0x0000 }   /* hiragana A, hiragana A, hiragana TO */
};
|
|
|
|
|
|
|
|
/*
 * Expected outcome of comparing testSourceCases[i] with testTargetCases[i]
 * in TestTertiary. Only the last pair expects the source to sort after the
 * target.
 */
const Collator::EComparisonResult CollationKanaTest::results[] = {
    /* 0 */ Collator::LESS,
    /* 1 */ Collator::LESS,
    /* 2 */ Collator::LESS,
    /* 3 */ Collator::LESS,
    /* 4 */ Collator::LESS,
    /* 5 */ Collator::GREATER
};
|
|
|
|
|
2001-03-20 00:26:15 +00:00
|
|
|
/*
 * Strings for TestBase, listed in the order the test expects them to sort:
 * each entry is expected to compare LESS than the one after it.
 */
const UChar CollationKanaTest::testBaseCases[][CollationKanaTest::MAX_TOKEN_LEN] = {
    /* 0 */ { 0x30AB, 0x0000 },           /* katakana KA */
    /* 1 */ { 0x30AB, 0x30AD, 0x0000 },   /* katakana KA, KI */
    /* 2 */ { 0x30AD, 0x0000 },           /* katakana KI */
    /* 3 */ { 0x30AD, 0x30AD, 0x0000 }    /* katakana KI, KI */
};
|
|
|
|
|
|
|
|
/*
 * Strings for TestPlainDakutenHandakuten, listed in the order the test
 * expects them to sort: each entry is expected to compare LESS than the one
 * after it. The entries pair a plain (HA) or voiced (BA) first letter with a
 * KA or KI second letter.
 */
const UChar CollationKanaTest::testPlainDakutenHandakutenCases[][CollationKanaTest::MAX_TOKEN_LEN] = {
    /* 0 */ { 0x30CF, 0x30AB, 0x0000 },   /* katakana HA, KA */
    /* 1 */ { 0x30D0, 0x30AB, 0x0000 },   /* katakana BA, KA */
    /* 2 */ { 0x30CF, 0x30AD, 0x0000 },   /* katakana HA, KI */
    /* 3 */ { 0x30D0, 0x30AD, 0x0000 }    /* katakana BA, KI */
};
|
|
|
|
|
|
|
|
/*
 * Strings for TestSmallLarge, listed in the order the test expects them to
 * sort: each entry is expected to compare LESS than the one after it. The
 * first letter alternates between small TU and regular TU.
 */
const UChar CollationKanaTest::testSmallLargeCases[][CollationKanaTest::MAX_TOKEN_LEN] = {
    /* 0 */ { 0x30C3, 0x30CF, 0x0000 },   /* katakana small TU, HA */
    /* 1 */ { 0x30C4, 0x30CF, 0x0000 },   /* katakana TU, HA */
    /* 2 */ { 0x30C3, 0x30D0, 0x0000 },   /* katakana small TU, BA */
    /* 3 */ { 0x30C4, 0x30D0, 0x0000 }    /* katakana TU, BA */
};
|
|
|
|
|
|
|
|
/*
 * Strings for TestKatakanaHiragana, listed in the order the test expects
 * them to sort: each entry is expected to compare LESS than the one after
 * it. The first letter alternates between hiragana A and katakana A.
 */
const UChar CollationKanaTest::testKatakanaHiraganaCases[][CollationKanaTest::MAX_TOKEN_LEN] = {
    /* 0 */ { 0x3042, 0x30C3, 0x0000 },   /* hiragana A, katakana small TU */
    /* 1 */ { 0x30A2, 0x30C3, 0x0000 },   /* katakana A, katakana small TU */
    /* 2 */ { 0x3042, 0x30C4, 0x0000 },   /* hiragana A, katakana TU */
    /* 3 */ { 0x30A2, 0x30C4, 0x0000 }    /* katakana A, katakana TU */
};
|
|
|
|
|
|
|
|
/*
 * Strings for TestChooonKigoo, listed in the order the test expects them to
 * sort: each entry is expected to compare LESS than the one after it.
 * 0x30FC is the prolonged sound mark (choo-on kigoo).
 */
const UChar CollationKanaTest::testChooonKigooCases[][CollationKanaTest::MAX_TOKEN_LEN] = {
    /* 0 */ { 0x30AB, 0x30FC, 0x3042, 0x0000 },   /* KA, prolonged mark, hiragana A */
    /* 1 */ { 0x30AB, 0x30FC, 0x30A2, 0x0000 },   /* KA, prolonged mark, katakana A */
    /* 2 */ { 0x30AB, 0x30A4, 0x3042, 0x0000 },   /* KA, katakana I, hiragana A */
    /* 3 */ { 0x30AB, 0x30A4, 0x30A2, 0x0000 },   /* KA, katakana I, katakana A */
    /* 4 */ { 0x30AD, 0x30A4, 0x3042, 0x0000 },   /* KI, katakana I, hiragana A */
    /* 5 */ { 0x30AD, 0x30A4, 0x30A2, 0x0000 },   /* KI, katakana I, katakana A */
    /* 6 */ { 0x30AD, 0x30FC, 0x3042, 0x0000 },   /* KI, prolonged mark, hiragana A */
    /* 7 */ { 0x30AD, 0x30FC, 0x30A2, 0x0000 }    /* KI, prolonged mark, katakana A */
};
|
|
|
|
|
1999-08-16 21:50:52 +00:00
|
|
|
/**
 * Compares one pair of strings in three ways and reports the outcome.
 *
 * The pair is compared directly as strings, through forward character
 * iterators, and through collation keys. All three outcomes are handed to
 * reportCResult() together with the expected result.
 *
 * @param source  left-hand string
 * @param target  right-hand string
 * @param result  expected comparison result
 */
void CollationKanaTest::doTest( UnicodeString source, UnicodeString target, Collator::EComparisonResult result)
{
    /* 1. direct string comparison */
    const Collator::EComparisonResult stringOutcome = myCollation->compare(source, target);

    /* 2. comparison through forward character iterators */
    SimpleFwdCharIterator sourceIter(source);
    SimpleFwdCharIterator targetIter(target);
    const Collator::EComparisonResult iterOutcome = myCollation->compare(sourceIter, targetIter);

    /* 3. comparison of collation keys; each key gets its own status code */
    CollationKey sourceKey;
    CollationKey targetKey;
    UErrorCode sourceKeyStatus = U_ZERO_ERROR;
    UErrorCode targetKeyStatus = U_ZERO_ERROR;
    myCollation->getCollationKey(source, sourceKey, sourceKeyStatus);
    myCollation->getCollationKey(target, targetKey, targetKeyStatus);

    if (U_FAILURE(sourceKeyStatus) || U_FAILURE(targetKeyStatus))
    {
        /* without both keys there is nothing meaningful to report */
        errln("SortKey generation Failed.\n");
        return;
    }

    const Collator::EComparisonResult keyOutcome = sourceKey.compareTo(targetKey);

    reportCResult( source, target, sourceKey, targetKey,
                   stringOutcome, keyOutcome, iterOutcome, result );
}
|
|
|
|
|
2000-08-23 19:11:16 +00:00
|
|
|
void CollationKanaTest::TestTertiary(/* char* par */)
|
1999-08-16 21:50:52 +00:00
|
|
|
{
|
|
|
|
int32_t i = 0;
|
2001-03-16 03:04:37 +00:00
|
|
|
UErrorCode status = U_ZERO_ERROR;
|
1999-08-16 21:50:52 +00:00
|
|
|
myCollation->setStrength(Collator::TERTIARY);
|
2001-03-16 03:04:37 +00:00
|
|
|
/* for one case, strcollinc fails, since it doesn't have good handling of contractions*/
|
|
|
|
/* normalization is turned off to stop strcollinc from executing */
|
|
|
|
myCollation->setAttribute(UCOL_NORMALIZATION_MODE, UCOL_ON, status);
|
|
|
|
myCollation->setAttribute(UCOL_CASE_LEVEL, UCOL_ON, status);
|
|
|
|
for (i = 0; i < 6; i++) {
|
1999-08-16 21:50:52 +00:00
|
|
|
doTest(testSourceCases[i], testTargetCases[i], results[i]);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2001-03-20 00:26:15 +00:00
|
|
|
/* Testing base letters */
|
|
|
|
void CollationKanaTest::TestBase()
|
|
|
|
{
|
|
|
|
int32_t i;
|
|
|
|
UErrorCode status = U_ZERO_ERROR;
|
|
|
|
myCollation->setStrength(Collator::PRIMARY);
|
|
|
|
for (i = 0; i < 3 ; i++)
|
|
|
|
doTest(testBaseCases[i], testBaseCases[i + 1], Collator::LESS);
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Testing plain, Daku-ten, Handaku-ten letters */
|
|
|
|
void CollationKanaTest::TestPlainDakutenHandakuten(void)
|
|
|
|
{
|
|
|
|
int32_t i;
|
|
|
|
UErrorCode status = U_ZERO_ERROR;
|
|
|
|
myCollation->setStrength(Collator::SECONDARY);
|
|
|
|
for (i = 0; i < 3 ; i++)
|
|
|
|
doTest(testPlainDakutenHandakutenCases[i], testPlainDakutenHandakutenCases[i + 1],
|
|
|
|
Collator::LESS);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Test Small, Large letters
|
|
|
|
*/
|
|
|
|
void CollationKanaTest::TestSmallLarge(void)
|
|
|
|
{
|
|
|
|
int32_t i;
|
|
|
|
UErrorCode status = U_ZERO_ERROR;
|
|
|
|
myCollation->setStrength(Collator::TERTIARY);
|
|
|
|
myCollation->setAttribute(UCOL_CASE_LEVEL, UCOL_ON, status);
|
|
|
|
for (i = 0; i < 3 ; i++)
|
|
|
|
doTest(testSmallLargeCases[i], testSmallLargeCases[i + 1], Collator::LESS);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Test Katakana, Hiragana letters
|
|
|
|
*/
|
|
|
|
void CollationKanaTest::TestKatakanaHiragana(void)
|
|
|
|
{
|
|
|
|
int32_t i;
|
|
|
|
UErrorCode status = U_ZERO_ERROR;
|
|
|
|
myCollation->setStrength(Collator::QUATERNARY);
|
|
|
|
myCollation->setAttribute(UCOL_CASE_LEVEL, UCOL_ON, status);
|
|
|
|
for (i = 0; i < 3 ; i++) {
|
|
|
|
doTest(testKatakanaHiraganaCases[i], testKatakanaHiraganaCases[i + 1],
|
|
|
|
Collator::LESS);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Test Choo-on kigoo
|
|
|
|
*/
|
|
|
|
void CollationKanaTest::TestChooonKigoo(void)
|
|
|
|
{
|
|
|
|
int32_t i;
|
|
|
|
UErrorCode status = U_ZERO_ERROR;
|
|
|
|
myCollation->setAttribute(UCOL_CASE_LEVEL, UCOL_ON, status);
|
|
|
|
for (i = 0; i < 7 ; i++) {
|
|
|
|
doTest(testChooonKigooCases[i], testChooonKigooCases[i + 1], Collator::LESS);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
|
2000-08-23 19:11:16 +00:00
|
|
|
/**
 * Maps a test index to its name and, when requested, runs that test.
 *
 * @param index  zero-based test number
 * @param exec   when true the selected test is executed; otherwise only
 *               name is filled in
 * @param name   receives the test's name, or "" when index is out of range
 *
 * The constructor leaves myCollation NULL when the collator cannot be
 * created, and every test dereferences it. In that state the name is still
 * reported but the test body is not run; an error is logged instead.
 */
void CollationKanaTest::runIndexedTest( int32_t index, UBool exec, const char* &name, char* /*par*/ )
{
    if (exec) logln("TestSuite CollationKanaTest: ");

    /* run a test only if execution was requested AND the fixture is usable */
    const UBool run = (UBool)(exec && myCollation != NULL);

    switch (index) {
        case 0: name = "TestTertiary"; if (run) TestTertiary(/* par */); break;
        case 1: name = "TestBase"; if (run) TestBase(/* par */); break;
        case 2: name = "TestSmallLarge"; if (run) TestSmallLarge(/* par */); break;
        /* NOTE(review): the doubled "Test" prefix looks like a typo; it is
         * kept unchanged in case callers refer to the test by this name. */
        case 3: name = "TestTestPlainDakutenHandakuten"; if (run) TestPlainDakutenHandakuten(/* par */); break;
        case 4: name = "TestKatakanaHiragana"; if (run) TestKatakanaHiragana(/* par */); break;
        case 5: name = "TestChooonKigoo"; if (run) TestChooonKigoo(/* par */); break;
        default: name = ""; break;
    }

    /* a real test was requested but could not be run: report it as an error */
    if (exec && !run && name[0] != 0) {
        errln("CollationKanaTest: collator was not created; test not run.");
    }
}
|
|
|
|
|
|
|
|
|