993 lines
37 KiB
C++
993 lines
37 KiB
C++
// © 2016 and later: Unicode, Inc. and others.
|
|
// License & terms of use: http://www.unicode.org/copyright.html
|
|
/************************************************************************
|
|
* COPYRIGHT:
|
|
* Copyright (c) 2000-2016, International Business Machines Corporation
|
|
* and others. All Rights Reserved.
|
|
************************************************************************/
|
|
/************************************************************************
|
|
* Date Name Description
|
|
* 1/03/2000 Madhu Creation.
|
|
************************************************************************/
|
|
|
|
#include "unicode/utypes.h"
|
|
|
|
#if !UCONFIG_NO_TRANSLITERATION
|
|
|
|
#include "ittrans.h"
|
|
#include "transapi.h"
|
|
#include "unicode/utypes.h"
|
|
#include "unicode/translit.h"
|
|
#include "unicode/unifilt.h"
|
|
#include "cpdtrans.h"
|
|
#include "cmemory.h"
|
|
#include <string.h>
|
|
#include <stdio.h>
|
|
#include <stdlib.h>
|
|
#include "unicode/rep.h"
|
|
#include "unicode/locid.h"
|
|
#include "unicode/uniset.h"
|
|
|
|
int32_t getInt(UnicodeString str)
|
|
{
|
|
char buffer[20];
|
|
int len=str.length();
|
|
if(len>=20) {
|
|
len=19;
|
|
}
|
|
str.extract(0, len, buffer, "");
|
|
buffer[len]=0;
|
|
return atoi(buffer);
|
|
}
|
|
|
|
//---------------------------------------------
|
|
// runIndexedTest
|
|
//---------------------------------------------
|
|
|
|
void
|
|
TransliteratorAPITest::runIndexedTest(int32_t index, UBool exec,
|
|
const char* &name, char* /*par*/) {
|
|
switch (index) {
|
|
TESTCASE(0,TestgetInverse);
|
|
TESTCASE(1,TestgetID);
|
|
TESTCASE(2,TestGetDisplayName);
|
|
TESTCASE(3,TestTransliterate1);
|
|
TESTCASE(4,TestTransliterate2);
|
|
TESTCASE(5,TestTransliterate3);
|
|
TESTCASE(6,TestSimpleKeyboardTransliterator);
|
|
TESTCASE(7,TestKeyboardTransliterator1);
|
|
TESTCASE(8,TestKeyboardTransliterator2);
|
|
TESTCASE(9,TestKeyboardTransliterator3);
|
|
TESTCASE(10,TestGetAdoptFilter);
|
|
TESTCASE(11,TestClone);
|
|
TESTCASE(12,TestNullTransliterator);
|
|
TESTCASE(13,TestRegisterUnregister);
|
|
TESTCASE(14,TestUnicodeFunctor);
|
|
default: name = ""; break;
|
|
}
|
|
}
|
|
|
|
|
|
void TransliteratorAPITest::TestgetID() {
|
|
UnicodeString trans="Latin-Greek";
|
|
UnicodeString ID;
|
|
UParseError parseError;
|
|
UErrorCode status = U_ZERO_ERROR;
|
|
Transliterator* t= Transliterator::createInstance(trans, UTRANS_FORWARD, parseError, status);
|
|
if(t==0 || U_FAILURE(status)){
|
|
dataerrln("FAIL: construction of Latin-Greek - %s",u_errorName(status));
|
|
return;
|
|
}else{
|
|
ID= t->getID();
|
|
if(ID != trans)
|
|
errln("FAIL: getID returned " + ID + " instead of Latin-Greek");
|
|
delete t;
|
|
}
|
|
int i;
|
|
for (i=0; i<Transliterator::countAvailableIDs(); i++){
|
|
status = U_ZERO_ERROR;
|
|
ID = (UnicodeString) Transliterator::getAvailableID(i);
|
|
if(ID.indexOf("Thai")>-1){
|
|
continue;
|
|
}
|
|
t = Transliterator::createInstance(ID, UTRANS_FORWARD, parseError, status);
|
|
if(t == 0){
|
|
errln("FAIL: " + ID);
|
|
continue;
|
|
}
|
|
if(ID != t->getID())
|
|
errln("FAIL: getID() returned " + t->getID() + " instead of " + ID);
|
|
delete t;
|
|
}
|
|
ID=(UnicodeString)Transliterator::getAvailableID(i);
|
|
if(ID != (UnicodeString)Transliterator::getAvailableID(0)){
|
|
errln("FAIL: calling getAvailableID(index > coundAvailableIDs) should make index=0\n");
|
|
}
|
|
|
|
Transliterator* t1=Transliterator::createInstance("Latin-Devanagari", UTRANS_FORWARD, parseError, status);
|
|
Transliterator* t2=Transliterator::createInstance("Latin-Greek", UTRANS_FORWARD, parseError, status);
|
|
if(t1 ==0 || t2 == 0){
|
|
errln("FAIL: construction");
|
|
return;
|
|
}
|
|
Transliterator* t3=t1->clone();
|
|
Transliterator* t4=t2->clone();
|
|
|
|
if(t1->getID() != t3->getID() || t2->getID() != t4->getID() ||
|
|
t1->getID() == t4->getID() || t2->getID() == t3->getID() ||
|
|
t1->getID()== t4->getID() )
|
|
errln("FAIL: getID or clone failed");
|
|
|
|
|
|
Transliterator* t5=Transliterator::createInstance("Latin-Devanagari", UTRANS_FORWARD, parseError, status);
|
|
if(t5 == 0)
|
|
errln("FAIL: construction");
|
|
else if(t1->getID() != t5->getID() || t5->getID() != t3->getID() || t1->getID() != t3->getID())
|
|
errln("FAIL: getID or clone failed");
|
|
|
|
|
|
delete t1;
|
|
delete t2;
|
|
delete t3;
|
|
delete t4;
|
|
delete t5;
|
|
}
|
|
|
|
void TransliteratorAPITest::TestgetInverse() {
|
|
UErrorCode status = U_ZERO_ERROR;
|
|
UParseError parseError;
|
|
Transliterator* t1 = Transliterator::createInstance("Katakana-Latin", UTRANS_FORWARD, parseError, status);
|
|
Transliterator* invt1 = Transliterator::createInstance("Latin-Katakana", UTRANS_FORWARD, parseError, status);
|
|
Transliterator* t2 = Transliterator::createInstance("Latin-Devanagari", UTRANS_FORWARD, parseError, status);
|
|
Transliterator* invt2 = Transliterator::createInstance("Devanagari-Latin", UTRANS_FORWARD, parseError, status);
|
|
if(t1 == 0 || invt1 == 0 || t2 == 0 || invt2 == 0) {
|
|
dataerrln("FAIL: in instantiation - %s", u_errorName(status));
|
|
return;
|
|
}
|
|
|
|
Transliterator* inverse1=t1->createInverse(status);
|
|
Transliterator* inverse2=t2->createInverse(status);
|
|
if(inverse1->getID() != invt1->getID() || inverse2->getID() != invt2->getID()
|
|
|| inverse1->getID() == invt2->getID() || inverse2->getID() == invt1->getID() )
|
|
errln("FAIL: getInverse() ");
|
|
|
|
UnicodeString TransID[]={
|
|
"Halfwidth-Fullwidth",
|
|
"Fullwidth-Halfwidth",
|
|
"Greek-Latin" ,
|
|
"Latin-Greek",
|
|
//"Arabic-Latin", // removed in 2.0
|
|
//"Latin-Arabic",
|
|
"Katakana-Latin",
|
|
"Latin-Katakana",
|
|
//"Hebrew-Latin", // removed in 2.0
|
|
//"Latin-Hebrew",
|
|
"Cyrillic-Latin",
|
|
"Latin-Cyrillic",
|
|
"Devanagari-Latin",
|
|
"Latin-Devanagari",
|
|
"Any-Hex",
|
|
"Hex-Any"
|
|
};
|
|
for(uint32_t i=0; i<UPRV_LENGTHOF(TransID); i=i+2){
|
|
Transliterator *trans1=Transliterator::createInstance(TransID[i], UTRANS_FORWARD, parseError, status);
|
|
if(t1 == 0){
|
|
errln("FAIL: in instantiation for" + TransID[i]);
|
|
continue;
|
|
}
|
|
Transliterator *inver1=trans1->createInverse(status);
|
|
if(inver1->getID() != TransID[i+1] )
|
|
errln("FAIL :getInverse() for " + TransID[i] + " returned " + inver1->getID() + " instead of " + TransID[i+1]);
|
|
delete inver1;
|
|
delete trans1;
|
|
}
|
|
delete t1;
|
|
delete t2;
|
|
delete invt1;
|
|
delete invt2;
|
|
delete inverse1;
|
|
delete inverse2;
|
|
|
|
}
|
|
|
|
void TransliteratorAPITest::TestClone(){
|
|
Transliterator *t1, *t2, *t3, *t4;
|
|
UErrorCode status = U_ZERO_ERROR;
|
|
UParseError parseError;
|
|
t1=Transliterator::createInstance("Latin-Devanagari", UTRANS_FORWARD, parseError, status);
|
|
t2=Transliterator::createInstance("Latin-Greek", UTRANS_FORWARD, parseError, status);
|
|
if(t1 == 0 || t2 == 0){
|
|
dataerrln("FAIL: construction - %s", u_errorName(status));
|
|
return;
|
|
}
|
|
t3=t1->clone();
|
|
t4=t2->clone();
|
|
|
|
if(t1->getID() != t3->getID() || t2->getID() != t4->getID() )
|
|
errln("FAIL: clone or getID failed");
|
|
if(t1->getID()==t4->getID() || t2->getID()==t3->getID() || t1->getID()==t4->getID())
|
|
errln("FAIL: clone or getID failed");
|
|
|
|
delete t1;
|
|
delete t2;
|
|
delete t3;
|
|
delete t4;
|
|
|
|
}
|
|
|
|
void TransliteratorAPITest::TestGetDisplayName() {
|
|
UnicodeString dispNames[]= {
|
|
//ID, displayName
|
|
//"CurlyQuotes-StraightQuotes" ,"CurlyQuotes to StraightQuotes",
|
|
"Any-Hex" ,"Any to Hex Escape",
|
|
"Halfwidth-Fullwidth" ,"Halfwidth to Fullwidth" ,
|
|
//"Latin-Arabic" ,"Latin to Arabic" ,
|
|
"Latin-Devanagari" ,"Latin to Devanagari" ,
|
|
"Greek-Latin" ,"Greek to Latin" ,
|
|
//"Arabic-Latin" ,"Arabic to Latin" ,
|
|
"Hex-Any" ,"Hex Escape to Any",
|
|
"Cyrillic-Latin" ,"Cyrillic to Latin" ,
|
|
"Latin-Greek" ,"Latin to Greek" ,
|
|
"Latin-Katakana" ,"Latin to Katakana" ,
|
|
//"Latin-Hebrew" ,"Latin to Hebrew" ,
|
|
"Katakana-Latin" ,"Katakana to Latin"
|
|
};
|
|
UnicodeString name="";
|
|
Transliterator* t;
|
|
UnicodeString message;
|
|
UErrorCode status = U_ZERO_ERROR;
|
|
UParseError parseError;
|
|
|
|
#if UCONFIG_NO_FORMATTING
|
|
logln("Skipping, UCONFIG_NO_FORMATTING is set\n");
|
|
return;
|
|
#else
|
|
|
|
for (uint32_t i=0; i<UPRV_LENGTHOF(dispNames); i=i+2 ) {
|
|
t = Transliterator::createInstance(dispNames[i+0], UTRANS_FORWARD, parseError, status);
|
|
if(t==0){
|
|
dataerrln("FAIL: construction: " + dispNames[i+0] + " - " + u_errorName(status));
|
|
status = U_ZERO_ERROR;
|
|
continue;
|
|
}
|
|
t->getDisplayName(t->getID(), name);
|
|
message="Display name for ID:" + t->getID();
|
|
// doTest(message, name, dispNames[i+1]); //!!! This will obviously fail for any locale other than english and its children!!!
|
|
name="";
|
|
t->getDisplayName(t->getID(), Locale::getUS(), name);
|
|
message.remove();
|
|
message.append("Display name for on english locale ID:");
|
|
message.append(t->getID());
|
|
// message="Display name for on english locale ID:" + t->getID();
|
|
doTest(message, name, dispNames[i+1]);
|
|
name="";
|
|
|
|
delete t;
|
|
}
|
|
#endif
|
|
|
|
}
|
|
|
|
void TransliteratorAPITest::TestTransliterate1(){
|
|
|
|
UnicodeString Data[]={
|
|
//ID, input string, transliterated string
|
|
"Any-Hex", "hello", UnicodeString("\\u0068\\u0065\\u006C\\u006C\\u006F", "") ,
|
|
"Hex-Any", UnicodeString("\\u0068\\u0065\\u006C\\u006C\\u006F", ""), "hello" ,
|
|
"Latin-Devanagari",CharsToUnicodeString("bha\\u0304rata"), CharsToUnicodeString("\\u092D\\u093E\\u0930\\u0924") ,
|
|
"Latin-Devanagari",UnicodeString("kra ksha khra gra cra dya dhya",""), CharsToUnicodeString("\\u0915\\u094D\\u0930 \\u0915\\u094D\\u0936 \\u0916\\u094D\\u0930 \\u0917\\u094D\\u0930 \\u091a\\u094D\\u0930 \\u0926\\u094D\\u092F \\u0927\\u094D\\u092F") ,
|
|
|
|
"Devanagari-Latin", CharsToUnicodeString("\\u092D\\u093E\\u0930\\u0924"), CharsToUnicodeString("bh\\u0101rata"),
|
|
// "Contracted-Expanded", CharsToUnicodeString("\\u00C0\\u00C1\\u0042"), CharsToUnicodeString("\\u0041\\u0300\\u0041\\u0301\\u0042") ,
|
|
// "Expanded-Contracted", CharsToUnicodeString("\\u0041\\u0300\\u0041\\u0301\\u0042"), CharsToUnicodeString("\\u00C0\\u00C1\\u0042") ,
|
|
//"Latin-Arabic", "aap", CharsToUnicodeString("\\u0627\\u06A4") ,
|
|
//"Arabic-Latin", CharsToUnicodeString("\\u0627\\u06A4"), "aap"
|
|
};
|
|
|
|
UnicodeString gotResult;
|
|
UnicodeString temp;
|
|
UnicodeString message;
|
|
Transliterator* t;
|
|
logln("Testing transliterate");
|
|
UErrorCode status = U_ZERO_ERROR;
|
|
UParseError parseError;
|
|
|
|
for(uint32_t i=0;i<UPRV_LENGTHOF(Data); i=i+3){
|
|
t=Transliterator::createInstance(Data[i+0], UTRANS_FORWARD, parseError, status);
|
|
if(t==0){
|
|
dataerrln("FAIL: construction: " + Data[i+0] + " Error: " + u_errorName(status));
|
|
dataerrln("PreContext: " + prettify(parseError.preContext) + " PostContext: " + prettify( parseError.postContext) );
|
|
status = U_ZERO_ERROR;
|
|
continue;
|
|
}
|
|
gotResult = Data[i+1];
|
|
t->transliterate(gotResult);
|
|
message=t->getID() + "->transliterate(UnicodeString, UnicodeString) for\n\t Source:" + prettify(Data[i+1]);
|
|
doTest(message, gotResult, Data[i+2]);
|
|
|
|
//doubt here
|
|
temp=Data[i+1];
|
|
t->transliterate(temp);
|
|
message.remove();
|
|
message.append(t->getID());
|
|
message.append("->transliterate(Replaceable) for \n\tSource:");
|
|
message.append(Data[i][1]);
|
|
doTest(message, temp, Data[i+2]);
|
|
|
|
callEverything(t, __LINE__);
|
|
delete t;
|
|
}
|
|
}
|
|
|
|
void TransliteratorAPITest::TestTransliterate2(){
|
|
//testing tranliterate(String text, int start, int limit, StringBuffer result)
|
|
UnicodeString Data2[]={
|
|
//ID, input string, start, limit, transliterated string
|
|
"Any-Hex", "hello! How are you?", "0", "5", UnicodeString("\\u0068\\u0065\\u006C\\u006C\\u006F", ""), UnicodeString("\\u0068\\u0065\\u006C\\u006C\\u006F! How are you?", "") ,
|
|
"Any-Hex", "hello! How are you?", "7", "12", UnicodeString("\\u0048\\u006F\\u0077\\u0020\\u0061", ""), UnicodeString("hello! \\u0048\\u006F\\u0077\\u0020\\u0061re you?", ""),
|
|
"Hex-Any", CharsToUnicodeString("\\u0068\\u0065\\u006C\\u006C\\u006F\\u0021\\u0020"), "0", "5", "hello", "hello! " ,
|
|
// "Contracted-Expanded", CharsToUnicodeString("\\u00C0\\u00C1\\u0042"), "1", "2", CharsToUnicodeString("\\u0041\\u0301"), CharsToUnicodeString("\\u00C0\\u0041\\u0301\\u0042") ,
|
|
"Devanagari-Latin", CharsToUnicodeString("\\u092D\\u093E\\u0930\\u0924"), "0", "1", "bha", CharsToUnicodeString("bha\\u093E\\u0930\\u0924") ,
|
|
"Devanagari-Latin", CharsToUnicodeString("\\u092D\\u093E\\u0930\\u0924"), "1", "2", CharsToUnicodeString("\\u0314\\u0101"), CharsToUnicodeString("\\u092D\\u0314\\u0101\\u0930\\u0924")
|
|
|
|
};
|
|
logln("\n Testing transliterate(String, int, int, StringBuffer)");
|
|
Transliterator* t;
|
|
UnicodeString gotResBuf;
|
|
UnicodeString temp;
|
|
int32_t start, limit;
|
|
UErrorCode status = U_ZERO_ERROR;
|
|
UParseError parseError;
|
|
|
|
for(uint32_t i=0; i<UPRV_LENGTHOF(Data2); i=i+6){
|
|
t=Transliterator::createInstance(Data2[i+0], UTRANS_FORWARD, parseError, status);
|
|
if(t==0){
|
|
dataerrln("FAIL: construction: " + prettify(Data2[i+0]) + " - " + u_errorName(status));
|
|
continue;
|
|
}
|
|
start=getInt(Data2[i+2]);
|
|
limit=getInt(Data2[i+3]);
|
|
Data2[i+1].extractBetween(start, limit, gotResBuf);
|
|
t->transliterate(gotResBuf);
|
|
// errln("FAIL: calling transliterate on " + t->getID());
|
|
doTest(t->getID() + ".transliterate(UnicodeString, int32_t, int32_t, UnicodeString):(" + start + "," + limit + ") for \n\t source: " + prettify(Data2[i+1]), gotResBuf, Data2[i+4]);
|
|
|
|
temp=Data2[i+1];
|
|
t->transliterate(temp, start, limit);
|
|
doTest(t->getID() + ".transliterate(Replaceable, int32_t, int32_t, ):(" + start + "," + limit + ") for \n\t source: " + prettify(Data2[i+1]), temp, Data2[i+5]);
|
|
status = U_ZERO_ERROR;
|
|
callEverything(t, __LINE__);
|
|
delete t;
|
|
t = NULL;
|
|
}
|
|
|
|
status = U_ZERO_ERROR;
|
|
logln("\n Try calling transliterate with illegal start and limit values");
|
|
t=Transliterator::createInstance("Any-Hex", UTRANS_FORWARD, parseError, status);
|
|
if(U_FAILURE(status)) {
|
|
errln("Error creating transliterator %s", u_errorName(status));
|
|
delete t;
|
|
return;
|
|
}
|
|
gotResBuf = temp = "try start greater than limit";
|
|
t->transliterate(gotResBuf, 10, 5);
|
|
if(gotResBuf == temp) {
|
|
logln("OK: start greater than limit value handled correctly");
|
|
} else {
|
|
errln("FAIL: start greater than limit value returned" + gotResBuf);
|
|
}
|
|
|
|
callEverything(t, __LINE__);
|
|
delete t;
|
|
|
|
}
|
|
void TransliteratorAPITest::TestTransliterate3(){
|
|
UnicodeString rs="This is the replaceable String";
|
|
UnicodeString Data[] = {
|
|
"0", "0", "This is the replaceable String",
|
|
"2", "3", UnicodeString("Th\\u0069s is the replaceable String", ""),
|
|
"21", "23", UnicodeString("Th\\u0069s is the repl\\u0061\\u0063eable String", ""),
|
|
"14", "17", UnicodeString("Th\\u0069s is t\\u0068\\u0065\\u0020repl\\u0061\\u0063eable String", ""),
|
|
};
|
|
int start, limit;
|
|
UnicodeString message;
|
|
UParseError parseError;
|
|
UErrorCode status = U_ZERO_ERROR;
|
|
Transliterator *t=Transliterator::createInstance("Any-Hex", UTRANS_FORWARD, parseError, status);
|
|
if(U_FAILURE(status)) {
|
|
errln("Error creating transliterator %s", u_errorName(status));
|
|
delete t;
|
|
return;
|
|
}
|
|
|
|
if(t == 0)
|
|
errln("FAIL : construction");
|
|
for(uint32_t i=0; i<UPRV_LENGTHOF(Data); i=i+3){
|
|
start=getInt(Data[i+0]);
|
|
limit=getInt(Data[i+1]);
|
|
t->transliterate(rs, start, limit);
|
|
message=t->getID() + ".transliterate(ReplaceableString, start, limit):("+start+","+limit+"):";
|
|
doTest(message, rs, Data[i+2]);
|
|
}
|
|
delete t;
|
|
}
|
|
|
|
void TransliteratorAPITest::TestSimpleKeyboardTransliterator(){
|
|
logln("simple call to transliterate");
|
|
UErrorCode status=U_ZERO_ERROR;
|
|
UParseError parseError;
|
|
Transliterator* t=Transliterator::createInstance("Any-Hex", UTRANS_FORWARD, parseError, status);
|
|
if(t == 0) {
|
|
UnicodeString context;
|
|
|
|
if (parseError.preContext[0]) {
|
|
context += (UnicodeString)" at " + parseError.preContext;
|
|
}
|
|
if (parseError.postContext[0]) {
|
|
context += (UnicodeString)" | " + parseError.postContext;
|
|
}
|
|
errln((UnicodeString)"FAIL: can't create Any-Hex, " +
|
|
(UnicodeString)u_errorName(status) + context);
|
|
return;
|
|
}
|
|
UTransPosition index={19,20,20,20};
|
|
UnicodeString rs= "Transliterate this-''";
|
|
UnicodeString insertion="abc";
|
|
UnicodeString expected=UnicodeString("Transliterate this-'\\u0061\\u0062\\u0063'", "");
|
|
t->transliterate(rs, index, insertion, status);
|
|
if(U_FAILURE(status))
|
|
errln("FAIL: " + t->getID()+ ".translitere(Replaceable, int[], UnicodeString, UErrorCode)-->" + (UnicodeString)u_errorName(status));
|
|
t->finishTransliteration(rs, index);
|
|
UnicodeString message="transliterate";
|
|
doTest(message, rs, expected);
|
|
|
|
logln("try calling transliterate with invalid index values");
|
|
UTransPosition index1[]={
|
|
//START, LIMIT, CURSOR
|
|
{10, 10, 12, 10}, //invalid since CURSOR>LIMIT valid:-START <= CURSOR <= LIMIT
|
|
{17, 16, 17, 17}, //invalid since START>LIMIT valid:-0<=START<=LIMIT
|
|
{-1, 16, 14, 16}, //invalid since START<0
|
|
{3, 50, 2, 50} //invalid since LIMIT>text.length()
|
|
};
|
|
for(uint32_t i=0; i<UPRV_LENGTHOF(index1); i++){
|
|
status=U_ZERO_ERROR;
|
|
t->transliterate(rs, index1[i], insertion, status);
|
|
if(status == U_ILLEGAL_ARGUMENT_ERROR)
|
|
logln("OK: invalid index values handled correctly");
|
|
else
|
|
errln("FAIL: invalid index values didn't throw U_ILLEGAL_ARGUMENT_ERROR throw" + (UnicodeString)u_errorName(status));
|
|
}
|
|
|
|
delete t;
|
|
}
|
|
void TransliteratorAPITest::TestKeyboardTransliterator1(){
|
|
UnicodeString Data[]={
|
|
//insertion, buffer
|
|
"a", UnicodeString("\\u0061", "") ,
|
|
"bbb", UnicodeString("\\u0061\\u0062\\u0062\\u0062", "") ,
|
|
"ca", UnicodeString("\\u0061\\u0062\\u0062\\u0062\\u0063\\u0061", "") ,
|
|
" ", UnicodeString("\\u0061\\u0062\\u0062\\u0062\\u0063\\u0061\\u0020", "") ,
|
|
"", UnicodeString("\\u0061\\u0062\\u0062\\u0062\\u0063\\u0061\\u0020", "") ,
|
|
|
|
"a", UnicodeString("\\u0061", "") ,
|
|
"b", UnicodeString("\\u0061\\u0062", "") ,
|
|
"z", UnicodeString("\\u0061\\u0062\\u007A", "") ,
|
|
"", UnicodeString("\\u0061\\u0062\\u007A", "")
|
|
|
|
};
|
|
UParseError parseError;
|
|
UErrorCode status = U_ZERO_ERROR;
|
|
Transliterator* t=Transliterator::createInstance("Any-Hex", UTRANS_FORWARD, parseError, status);
|
|
if(U_FAILURE(status)) {
|
|
errln("Error creating transliterator %s", u_errorName(status));
|
|
delete t;
|
|
return;
|
|
}
|
|
//keyboardAux(t, Data);
|
|
UTransPosition index={0, 0, 0, 0};
|
|
UnicodeString s;
|
|
uint32_t i;
|
|
logln("Testing transliterate(Replaceable, int32_t, UnicodeString, UErrorCode)");
|
|
for (i=0; i<10; i=i+2) {
|
|
UnicodeString log;
|
|
if (Data[i+0] != "") {
|
|
log = s + " + " + Data[i+0] + " -> ";
|
|
t->transliterate(s, index, Data[i+0], status);
|
|
if(U_FAILURE(status)){
|
|
errln("FAIL: " + t->getID()+ ".transliterate(Replaceable, int32_t[], UnicodeString, UErrorCode)-->" + (UnicodeString)u_errorName(status));
|
|
continue;
|
|
}
|
|
}else {
|
|
log = s + " => ";
|
|
t->finishTransliteration(s, index);
|
|
}
|
|
// Show the start index '{' and the cursor '|'
|
|
displayOutput(s, Data[i+1], log, index);
|
|
|
|
}
|
|
|
|
s="";
|
|
status=U_ZERO_ERROR;
|
|
index.contextStart = index.contextLimit = index.start = index.limit = 0;
|
|
logln("Testing transliterate(Replaceable, int32_t, UChar, UErrorCode)");
|
|
for(i=10; i<UPRV_LENGTHOF(Data); i=i+2){
|
|
UnicodeString log;
|
|
if (Data[i+0] != "") {
|
|
log = s + " + " + Data[i+0] + " -> ";
|
|
UChar c=Data[i+0].charAt(0);
|
|
t->transliterate(s, index, c, status);
|
|
if(U_FAILURE(status)) {
|
|
errln("FAIL: " + t->getID()+ ".transliterate(Replaceable, int32_t[], UChar, UErrorCode)-->" + (UnicodeString)u_errorName(status));
|
|
continue;
|
|
}
|
|
} else {
|
|
log = s + " => ";
|
|
t->finishTransliteration(s, index);
|
|
}
|
|
// Show the start index '{' and the cursor '|'
|
|
displayOutput(s, Data[i+1], log, index);
|
|
}
|
|
|
|
delete t;
|
|
}
|
|
|
|
void TransliteratorAPITest::TestKeyboardTransliterator2(){
|
|
UnicodeString Data[]={
|
|
//insertion, buffer, index[START], index[LIMIT], index[CURSOR]
|
|
//data for Any-Hex
|
|
"abc", UnicodeString("Initial String: add-\\u0061\\u0062\\u0063-", ""), "19", "20", "20",
|
|
"a", UnicodeString("In\\u0069\\u0061tial String: add-\\u0061\\u0062\\u0063-", ""), "2", "3", "2" ,
|
|
"b", UnicodeString("\\u0062In\\u0069\\u0061tial String: add-\\u0061\\u0062\\u0063-", ""), "0", "0", "0" ,
|
|
"", UnicodeString("\\u0062In\\u0069\\u0061tial String: add-\\u0061\\u0062\\u0063-", ""), "0", "0", "0" ,
|
|
//data for Latin-Devanagiri
|
|
CharsToUnicodeString("a\\u0304"), CharsToUnicodeString("Hindi -\\u0906-"), "6", "7", "6",
|
|
CharsToUnicodeString("ma\\u0304"), CharsToUnicodeString("Hindi -\\u0906\\u092E\\u093E-"), "7", "8", "7",
|
|
CharsToUnicodeString("ra\\u0304"), CharsToUnicodeString("Hi\\u0930\\u093Endi -\\u0906\\u092E\\u093E-"),"1", "2", "2",
|
|
CharsToUnicodeString(""), CharsToUnicodeString("Hi\\u0930\\u093Endi -\\u0906\\u092E\\u093E-"),"1", "2", "2"
|
|
//data for contracted-Expanded
|
|
// CharsToUnicodeString("\\u00C1"), CharsToUnicodeString("Ad\\u0041\\u0301d here:"), "1", "2", "1" ,
|
|
// CharsToUnicodeString("\\u00C0"), CharsToUnicodeString("Ad\\u0041\\u0301d here:\\u0041\\u0300"), "11", "11", "11",
|
|
// "", CharsToUnicodeString("Ad\\u0041\\u0301d here:\\u0041\\u0300"), "11", "11", "11",
|
|
};
|
|
Transliterator *t;
|
|
UnicodeString rs;
|
|
UnicodeString dataStr;
|
|
logln("Testing transliterate(Replaceable, int32_t, UnicodeString, UErrorCode)");
|
|
UErrorCode status = U_ZERO_ERROR;
|
|
UParseError parseError;
|
|
rs="Initial String: add--";
|
|
t=Transliterator::createInstance("Any-Hex", UTRANS_FORWARD, parseError, status);
|
|
if(t == 0)
|
|
dataerrln("FAIL : construction - %s", u_errorName(status));
|
|
else {
|
|
keyboardAux(t, Data, rs, 0, 20);
|
|
delete t;
|
|
}
|
|
|
|
rs="Hindi --";
|
|
t=Transliterator::createInstance("Latin-Devanagari", UTRANS_FORWARD, parseError, status);
|
|
if(t == 0)
|
|
dataerrln("FAIL : construction - %s", u_errorName(status));
|
|
else
|
|
keyboardAux(t, Data, rs, 20, 40);
|
|
|
|
|
|
// rs="Add here:";
|
|
// t=Transliterator::createInstance("Contracted-Expanded");
|
|
// keyboardAux(t, Data, rs, 35, 55);
|
|
|
|
|
|
delete t;
|
|
}
|
|
|
|
void TransliteratorAPITest::TestKeyboardTransliterator3(){
|
|
UnicodeString s="This is the main string";
|
|
UnicodeString Data[] = {
|
|
"0", "0", "0", "This is the main string",
|
|
"1", "3", "2", UnicodeString("Th\\u0069s is the main string", ""),
|
|
"20", "21", "20", UnicodeString("Th\\u0069s is the mai\\u006E string", "")
|
|
};
|
|
|
|
UErrorCode status=U_ZERO_ERROR;
|
|
UParseError parseError;
|
|
UTransPosition index={0, 0, 0, 0};
|
|
logln("Testing transliterate(Replaceable, int32_t, UErrorCode)");
|
|
Transliterator *t=Transliterator::createInstance("Any-Hex", UTRANS_FORWARD, parseError, status);
|
|
if(t == 0 || U_FAILURE(status)) {
|
|
errln("Error creating transliterator %s", u_errorName(status));
|
|
delete t;
|
|
return;
|
|
}
|
|
for(uint32_t i=0; i<UPRV_LENGTHOF(Data); i=i+4){
|
|
UnicodeString log;
|
|
index.contextStart=getInt(Data[i+0]);
|
|
index.contextLimit=index.limit=getInt(Data[i+1]);
|
|
index.start=getInt(Data[i+2]);
|
|
t->transliterate(s, index, status);
|
|
if(U_FAILURE(status)){
|
|
errln("FAIL: " + t->getID()+ ".transliterate(Replaceable, int32_t[], UErrorCode)-->" + (UnicodeString)u_errorName(status));
|
|
continue;
|
|
}
|
|
t->finishTransliteration(s, index);
|
|
log = s + " => ";
|
|
// Show the start index '{' and the cursor '|'
|
|
displayOutput(s, Data[i+3], log, index);
|
|
}
|
|
|
|
delete t;
|
|
}
|
|
void TransliteratorAPITest::TestNullTransliterator(){
|
|
UErrorCode status=U_ZERO_ERROR;
|
|
UnicodeString s("Transliterate using null transliterator");
|
|
Transliterator *nullTrans=Transliterator::createInstance("Any-Null", UTRANS_FORWARD, status);
|
|
int32_t transLimit;
|
|
int32_t start=0;
|
|
int32_t limit=s.length();
|
|
UnicodeString replaceable=s;
|
|
transLimit=nullTrans->transliterate(replaceable, start, limit);
|
|
if(transLimit != limit){
|
|
errln("ERROR: NullTransliterator->transliterate() failed");
|
|
}
|
|
doTest((UnicodeString)"nulTrans->transliterate", replaceable, s);
|
|
replaceable.remove();
|
|
replaceable.append(s);
|
|
UTransPosition index;
|
|
index.contextStart =start;
|
|
index.contextLimit = limit;
|
|
index.start = 0;
|
|
index.limit = limit;
|
|
nullTrans->finishTransliteration(replaceable, index);
|
|
if(index.start != limit){
|
|
errln("ERROR: NullTransliterator->handleTransliterate() failed");
|
|
}
|
|
doTest((UnicodeString)"NullTransliterator->handleTransliterate", replaceable, s);
|
|
callEverything(nullTrans, __LINE__);
|
|
delete nullTrans;
|
|
|
|
|
|
}
|
|
void TransliteratorAPITest::TestRegisterUnregister(){
|
|
|
|
UErrorCode status=U_ZERO_ERROR;
|
|
/* Make sure it doesn't exist */
|
|
if (Transliterator::createInstance("TestA-TestB", UTRANS_FORWARD, status) != NULL) {
|
|
errln("FAIL: TestA-TestB already registered\n");
|
|
return;
|
|
}
|
|
/* Check inverse too
|
|
if (Transliterator::createInstance("TestA-TestB",
|
|
(UTransDirection)UTRANS_REVERSE) != NULL) {
|
|
errln("FAIL: TestA-TestB inverse already registered\n");
|
|
return;
|
|
}
|
|
*/
|
|
status =U_ZERO_ERROR;
|
|
|
|
/* Create it */
|
|
UParseError parseError;
|
|
Transliterator *t = Transliterator::createFromRules("TestA-TestB",
|
|
"a<>b",
|
|
UTRANS_FORWARD, parseError,
|
|
status);
|
|
/* Register it */
|
|
Transliterator::registerInstance(t);
|
|
|
|
/* Now check again -- should exist now*/
|
|
Transliterator *s = Transliterator::createInstance("TestA-TestB", UTRANS_FORWARD, status);
|
|
if (s == NULL) {
|
|
errln("FAIL: TestA-TestB not registered\n");
|
|
return;
|
|
}
|
|
callEverything(s, __LINE__);
|
|
callEverything(t, __LINE__);
|
|
delete s;
|
|
|
|
/* Check inverse too
|
|
s = Transliterator::createInstance("TestA-TestB",
|
|
(UTransDirection)UTRANS_REVERSE);
|
|
if (s == NULL) {
|
|
errln("FAIL: TestA-TestB inverse not registered\n");
|
|
return;
|
|
}
|
|
delete s;
|
|
*/
|
|
|
|
/*unregister the instance*/
|
|
Transliterator::unregister("TestA-TestB");
|
|
/* now Make sure it doesn't exist */
|
|
if (Transliterator::createInstance("TestA-TestB", UTRANS_FORWARD, status) != NULL) {
|
|
errln("FAIL: TestA-TestB isn't unregistered\n");
|
|
return;
|
|
}
|
|
|
|
}
|
|
|
|
|
|
int gTestFilter1ClassID = 0;
|
|
int gTestFilter2ClassID = 0;
|
|
int gTestFilter3ClassID = 0;
|
|
|
|
/**
|
|
* Used by TestFiltering().
|
|
*/
|
|
class TestFilter1 : public UnicodeFilter {
|
|
UClassID getDynamicClassID()const { return &gTestFilter1ClassID; }
|
|
virtual TestFilter1* clone() const {
|
|
return new TestFilter1(*this);
|
|
}
|
|
virtual UBool contains(UChar32 c) const {
|
|
if(c==0x63 || c==0x61 || c==0x43 || c==0x41)
|
|
return FALSE;
|
|
else
|
|
return TRUE;
|
|
}
|
|
// Stubs
|
|
virtual UnicodeString& toPattern(UnicodeString& result,
|
|
UBool /*escapeUnprintable*/) const {
|
|
return result;
|
|
}
|
|
virtual UBool matchesIndexValue(uint8_t /*v*/) const {
|
|
return FALSE;
|
|
}
|
|
virtual void addMatchSetTo(UnicodeSet& /*toUnionTo*/) const {}
|
|
};
|
|
class TestFilter2 : public UnicodeFilter {
|
|
UClassID getDynamicClassID()const { return &gTestFilter2ClassID; }
|
|
virtual TestFilter2* clone() const {
|
|
return new TestFilter2(*this);
|
|
}
|
|
virtual UBool contains(UChar32 c) const {
|
|
if(c==0x65 || c==0x6c)
|
|
return FALSE;
|
|
else
|
|
return TRUE;
|
|
}
|
|
// Stubs
|
|
virtual UnicodeString& toPattern(UnicodeString& result,
|
|
UBool /*escapeUnprintable*/) const {
|
|
return result;
|
|
}
|
|
virtual UBool matchesIndexValue(uint8_t /*v*/) const {
|
|
return FALSE;
|
|
}
|
|
virtual void addMatchSetTo(UnicodeSet& /*toUnionTo*/) const {}
|
|
};
|
|
class TestFilter3 : public UnicodeFilter {
|
|
UClassID getDynamicClassID()const { return &gTestFilter3ClassID; }
|
|
virtual TestFilter3* clone() const {
|
|
return new TestFilter3(*this);
|
|
}
|
|
virtual UBool contains(UChar32 c) const {
|
|
if(c==0x6f || c==0x77)
|
|
return FALSE;
|
|
else
|
|
return TRUE;
|
|
}
|
|
// Stubs
|
|
virtual UnicodeString& toPattern(UnicodeString& result,
|
|
UBool /*escapeUnprintable*/) const {
|
|
return result;
|
|
}
|
|
virtual UBool matchesIndexValue(uint8_t /*v*/) const {
|
|
return FALSE;
|
|
}
|
|
virtual void addMatchSetTo(UnicodeSet& /*toUnionTo*/) const {}
|
|
};
|
|
|
|
|
|
void TransliteratorAPITest::TestGetAdoptFilter(){
|
|
UErrorCode status = U_ZERO_ERROR;
|
|
UParseError parseError;
|
|
Transliterator *t=Transliterator::createInstance("Any-Hex", UTRANS_FORWARD, parseError, status);
|
|
if(t == 0 || U_FAILURE(status)) {
|
|
errln("Error creating transliterator %s", u_errorName(status));
|
|
delete t;
|
|
return;
|
|
}
|
|
const UnicodeFilter *u=t->getFilter();
|
|
if(u != NULL){
|
|
errln("FAIL: getFilter failed. Didn't return null when the transliterator used no filtering");
|
|
delete t;
|
|
return;
|
|
}
|
|
|
|
UnicodeString got, temp, message;
|
|
UnicodeString data="ABCabcbbCBa";
|
|
temp = data;
|
|
t->transliterate(temp);
|
|
t->adoptFilter(new TestFilter1);
|
|
|
|
got = data;
|
|
t->transliterate(got);
|
|
UnicodeString exp=UnicodeString("A\\u0042Ca\\u0062c\\u0062\\u0062C\\u0042a", "");
|
|
message="transliteration after adoptFilter(a,A,c,C) ";
|
|
doTest(message, got, exp);
|
|
|
|
logln("Testing round trip");
|
|
t->adoptFilter((UnicodeFilter*)u);
|
|
if(t->getFilter() == NULL)
|
|
logln("OK: adoptFilter and getFilter round trip worked");
|
|
else
|
|
errln("FAIL: adoptFilter or getFilter round trip failed");
|
|
|
|
got = data;
|
|
t->transliterate(got);
|
|
exp=UnicodeString("\\u0041\\u0042\\u0043\\u0061\\u0062\\u0063\\u0062\\u0062\\u0043\\u0042\\u0061", "");
|
|
message="transliteration after adopting null filter";
|
|
doTest(message, got, exp);
|
|
message="adoptFilter round trip";
|
|
doTest("adoptFilter round trip", got, temp);
|
|
|
|
t->adoptFilter(new TestFilter2);
|
|
callEverything(t, __LINE__);
|
|
data="heelloe";
|
|
exp=UnicodeString("\\u0068eell\\u006Fe", "");
|
|
got = data;
|
|
t->transliterate(got);
|
|
message="transliteration using (e,l) filter";
|
|
doTest("transliteration using (e,l) filter", got, exp);
|
|
|
|
data="are well";
|
|
exp=UnicodeString("\\u0061\\u0072e\\u0020\\u0077ell", "");
|
|
got = data;
|
|
t->transliterate(got);
|
|
doTest(message, got, exp);
|
|
|
|
t->adoptFilter(new TestFilter3);
|
|
data="ho, wow!";
|
|
exp=UnicodeString("\\u0068o\\u002C\\u0020wow\\u0021", "");
|
|
got = data;
|
|
t->transliterate(got);
|
|
message="transliteration using (o,w) filter";
|
|
doTest("transliteration using (o,w) filter", got, exp);
|
|
|
|
data="owl";
|
|
exp=UnicodeString("ow\\u006C", "");
|
|
got = data;
|
|
t->transliterate(got);
|
|
doTest("transliteration using (o,w) filter", got, exp);
|
|
|
|
delete t;
|
|
|
|
}
|
|
|
|
|
|
|
|
void TransliteratorAPITest::keyboardAux(Transliterator *t, UnicodeString DATA[], UnicodeString& s, int32_t begin, int32_t end) {
|
|
UTransPosition index={0, 0, 0, 0};
|
|
UErrorCode status=U_ZERO_ERROR;
|
|
for (int32_t i=begin; i<end; i=i+5) {
|
|
UnicodeString log;
|
|
if (DATA[i+0] != "") {
|
|
log = s + " + " + DATA[i] + " -> ";
|
|
index.contextStart=getInt(DATA[i+2]);
|
|
index.contextLimit=index.limit=getInt(DATA[i+3]);
|
|
index.start=getInt(DATA[i+4]);
|
|
t->transliterate(s, index, DATA[i+0], status);
|
|
if(U_FAILURE(status)){
|
|
errln("FAIL: " + t->getID()+ ".transliterate(Replaceable, int32_t[], UnicodeString, UErrorCode)-->" + (UnicodeString)u_errorName(status));
|
|
continue;
|
|
}
|
|
log = s + " => ";
|
|
t->finishTransliteration(s, index);
|
|
}
|
|
// Show the start index '{' and the cursor '|'
|
|
displayOutput(s, DATA[i+1], log, index);
|
|
|
|
}
|
|
}
|
|
|
|
void TransliteratorAPITest::displayOutput(const UnicodeString& got, const UnicodeString& expected, UnicodeString& log, UTransPosition& index){
|
|
// Show the start index '{' and the cursor '|'
|
|
UnicodeString a, b, c, d, e;
|
|
got.extractBetween(0, index.contextStart, a);
|
|
got.extractBetween(index.contextStart, index.start, b);
|
|
got.extractBetween(index.start, index.limit, c);
|
|
got.extractBetween(index.limit, index.contextLimit, d);
|
|
got.extractBetween(index.contextLimit, got.length(), e);
|
|
log.append(a).
|
|
append((UChar)0x7b/*{*/).
|
|
append(b).
|
|
append((UChar)0x7c/*|*/).
|
|
append(c).
|
|
append((UChar)0x7c).
|
|
append(d).
|
|
append((UChar)0x7d/*}*/).
|
|
append(e);
|
|
if (got == expected)
|
|
logln("OK:" + prettify(log));
|
|
else
|
|
errln("FAIL: " + prettify(log) + ", expected " + prettify(expected));
|
|
}
|
|
|
|
|
|
/*Internal Functions used*/
|
|
void TransliteratorAPITest::doTest(const UnicodeString& message, const UnicodeString& result, const UnicodeString& expected){
|
|
if (prettify(result) == prettify(expected))
|
|
logln((UnicodeString)"Ok: " + prettify(message) + " passed \"" + prettify(expected) + "\"");
|
|
else
|
|
dataerrln((UnicodeString)"FAIL:" + message + " failed Got-->" + prettify(result)+ ", Expected--> " + prettify(expected) );
|
|
}
|
|
|
|
|
|
//
|
|
// callEverything call all of the const (non-destructive) methods on a
|
|
// transliterator, just to verify that they don't fail in some
|
|
// destructive way.
|
|
//
|
|
#define CEASSERT(a) UPRV_BLOCK_MACRO_BEGIN { \
|
|
if (!(a)) { \
|
|
errln("FAIL at line %d from line %d: %s", __LINE__, line, #a); \
|
|
return; \
|
|
} \
|
|
} UPRV_BLOCK_MACRO_END
|
|
|
|
void TransliteratorAPITest::callEverything(const Transliterator *tr, int line) {
|
|
Transliterator *clonedTR = tr->clone();
|
|
CEASSERT(clonedTR != NULL);
|
|
|
|
int32_t maxcl = tr->getMaximumContextLength();
|
|
CEASSERT(clonedTR->getMaximumContextLength() == maxcl);
|
|
|
|
UnicodeString id;
|
|
UnicodeString clonedId;
|
|
id = tr->getID();
|
|
clonedId = clonedTR->getID();
|
|
CEASSERT(id == clonedId);
|
|
|
|
const UnicodeFilter *filter = tr->getFilter();
|
|
const UnicodeFilter *clonedFilter = clonedTR->getFilter();
|
|
if (filter == NULL || clonedFilter == NULL) {
|
|
// If one filter is NULL they better both be NULL.
|
|
CEASSERT(filter == clonedFilter);
|
|
} else {
|
|
CEASSERT(filter != clonedFilter);
|
|
}
|
|
|
|
UnicodeString rules;
|
|
UnicodeString clonedRules;
|
|
rules = tr->toRules(rules, FALSE);
|
|
clonedRules = clonedTR->toRules(clonedRules, FALSE);
|
|
CEASSERT(rules == clonedRules);
|
|
|
|
UnicodeSet sourceSet;
|
|
UnicodeSet clonedSourceSet;
|
|
tr->getSourceSet(sourceSet);
|
|
clonedTR->getSourceSet(clonedSourceSet);
|
|
CEASSERT(clonedSourceSet == sourceSet);
|
|
|
|
UnicodeSet targetSet;
|
|
UnicodeSet clonedTargetSet;
|
|
tr->getTargetSet(targetSet);
|
|
clonedTR->getTargetSet(clonedTargetSet);
|
|
CEASSERT(targetSet == clonedTargetSet);
|
|
|
|
UClassID classID = tr->getDynamicClassID();
|
|
CEASSERT(classID == clonedTR->getDynamicClassID());
|
|
CEASSERT(classID != 0);
|
|
|
|
delete clonedTR;
|
|
}
|
|
|
|
static const int MyUnicodeFunctorTestClassID = 0;
|
|
class MyUnicodeFunctorTestClass : public UnicodeFunctor {
|
|
public:
|
|
virtual UnicodeFunctor* clone() const {return NULL;}
|
|
static UClassID getStaticClassID(void) {return (UClassID)&MyUnicodeFunctorTestClassID;}
|
|
virtual UClassID getDynamicClassID(void) const {return getStaticClassID();}
|
|
virtual void setData(const TransliterationRuleData*) {}
|
|
};
|
|
|
|
void TransliteratorAPITest::TestUnicodeFunctor() {
|
|
MyUnicodeFunctorTestClass myClass;
|
|
if (myClass.toMatcher() != NULL) {
|
|
errln("FAIL: UnicodeFunctor::toMatcher did not return NULL");
|
|
}
|
|
if (myClass.toReplacer() != NULL) {
|
|
errln("FAIL: UnicodeFunctor::toReplacer did not return NULL");
|
|
}
|
|
}
|
|
|
|
|
|
#endif /* #if !UCONFIG_NO_TRANSLITERATION */
|