1999-10-26 17:16:13 +00:00
|
|
|
/*
|
|
|
|
**********************************************************************
|
2000-03-07 02:39:27 +00:00
|
|
|
* Copyright (C) 1999, International Business Machines
|
|
|
|
* Corporation and others. All Rights Reserved.
|
1999-10-26 17:16:13 +00:00
|
|
|
**********************************************************************
|
|
|
|
* Date Name Description
|
|
|
|
* 10/20/99 alan Creation.
|
|
|
|
**********************************************************************
|
|
|
|
*/
|
|
|
|
|
1999-12-28 23:57:50 +00:00
|
|
|
#include "unicode/utypes.h"
|
1999-10-20 22:08:09 +00:00
|
|
|
#include "usettest.h"
|
1999-12-28 23:57:50 +00:00
|
|
|
#include "unicode/uniset.h"
|
1999-10-20 22:08:09 +00:00
|
|
|
|
|
|
|
// Expands to one complete `case` of the switch in runIndexedTest().
// The test's name is always stored in `name`; when `exec` is set, a banner
// line and an empty line are logged and the test method is then invoked.
#define CASE(testIndex, testMethod)        \
    case testIndex:                        \
        name = #testMethod;                \
        if (exec) {                        \
            logln(#testMethod "---");      \
            logln((UnicodeString)"");      \
            testMethod();                  \
        }                                  \
        break;
|
|
|
|
|
|
|
|
void
|
|
|
|
UnicodeSetTest::runIndexedTest(int32_t index, bool_t exec,
|
|
|
|
char* &name, char* par) {
|
|
|
|
// if (exec) logln((UnicodeString)"TestSuite UnicodeSetTest");
|
|
|
|
switch (index) {
|
1999-10-26 17:16:13 +00:00
|
|
|
CASE(0,TestPatterns)
|
|
|
|
CASE(1,TestAddRemove)
|
2000-01-12 18:04:21 +00:00
|
|
|
CASE(2,TestCategories)
|
1999-10-20 22:08:09 +00:00
|
|
|
default: name = ""; break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
void
|
1999-12-22 22:57:04 +00:00
|
|
|
UnicodeSetTest::TestPatterns(void) {
|
1999-10-26 17:16:13 +00:00
|
|
|
UnicodeSet set;
|
|
|
|
expectPattern(set, "[[a-m]&[d-z]&[k-y]]", "km");
|
|
|
|
expectPattern(set, "[[a-z]-[m-y]-[d-r]]", "aczz");
|
|
|
|
expectPattern(set, "[a\\-z]", "--aazz");
|
|
|
|
expectPattern(set, "[-az]", "--aazz");
|
|
|
|
expectPattern(set, "[az-]", "--aazz");
|
|
|
|
expectPattern(set, "[[[a-z]-[aeiou]i]]", "bdfnptvz");
|
|
|
|
|
|
|
|
// Throw in a test of complement
|
|
|
|
set.complement();
|
|
|
|
UnicodeString exp;
|
|
|
|
exp.append((UChar)0x0000).append("aeeoouu").append((UChar)('z'+1)).append((UChar)0xFFFF);
|
|
|
|
expectPairs(set, exp);
|
|
|
|
}
|
|
|
|
|
2000-01-12 18:04:21 +00:00
|
|
|
void
|
|
|
|
UnicodeSetTest::TestCategories(void) {
|
|
|
|
UErrorCode status = U_ZERO_ERROR;
|
|
|
|
const char* pat = " [:Lu:] "; // Whitespace ok outside [:..:]
|
|
|
|
UnicodeSet set(pat, status);
|
|
|
|
if (U_FAILURE(status)) {
|
|
|
|
errln((UnicodeString)"Fail: Can't construct set with " + pat);
|
|
|
|
} else {
|
|
|
|
expectContainment(set, pat, "ABC", "abc");
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
1999-10-26 17:16:13 +00:00
|
|
|
void
|
1999-12-22 22:57:04 +00:00
|
|
|
UnicodeSetTest::TestAddRemove(void) {
|
1999-10-20 22:08:09 +00:00
|
|
|
UErrorCode status = U_ZERO_ERROR;
|
|
|
|
|
|
|
|
UnicodeSet set; // Construct empty set
|
|
|
|
set.add('a', 'z');
|
1999-10-26 17:16:13 +00:00
|
|
|
expectPairs(set, "az");
|
1999-10-20 22:08:09 +00:00
|
|
|
set.remove('m', 'p');
|
1999-10-26 17:16:13 +00:00
|
|
|
expectPairs(set, "alqz");
|
1999-10-20 22:08:09 +00:00
|
|
|
set.remove('e', 'g');
|
1999-10-26 17:16:13 +00:00
|
|
|
expectPairs(set, "adhlqz");
|
1999-10-20 22:08:09 +00:00
|
|
|
set.remove('d', 'i');
|
1999-10-26 17:16:13 +00:00
|
|
|
expectPairs(set, "acjlqz");
|
1999-10-20 22:08:09 +00:00
|
|
|
set.remove('c', 'r');
|
1999-10-26 17:16:13 +00:00
|
|
|
expectPairs(set, "absz");
|
1999-10-20 22:08:09 +00:00
|
|
|
set.add('f', 'q');
|
1999-10-26 17:16:13 +00:00
|
|
|
expectPairs(set, "abfqsz");
|
1999-10-20 22:08:09 +00:00
|
|
|
set.remove('a', 'g');
|
1999-10-26 17:16:13 +00:00
|
|
|
expectPairs(set, "hqsz");
|
1999-10-20 22:08:09 +00:00
|
|
|
set.remove('a', 'z');
|
1999-10-26 17:16:13 +00:00
|
|
|
expectPairs(set, "");
|
1999-10-20 22:08:09 +00:00
|
|
|
|
1999-10-26 17:16:13 +00:00
|
|
|
// Try removing an entire set from another set
|
|
|
|
expectPattern(set, "[c-x]", "cx");
|
|
|
|
UnicodeSet set2;
|
|
|
|
expectPattern(set2, "[f-ky-za-bc[vw]]", "acfkvwyz");
|
|
|
|
set.removeAll(set2);
|
|
|
|
expectPairs(set, "deluxx");
|
1999-10-20 22:08:09 +00:00
|
|
|
|
1999-10-26 17:16:13 +00:00
|
|
|
// Try adding an entire set to another set
|
|
|
|
expectPattern(set, "[jackiemclean]", "aacceein");
|
|
|
|
expectPattern(set2, "[hitoshinamekatajamesanderson]", "aadehkmort");
|
|
|
|
set.addAll(set2);
|
|
|
|
expectPairs(set, "aacehort");
|
1999-10-20 22:08:09 +00:00
|
|
|
|
1999-10-26 17:16:13 +00:00
|
|
|
// Test commutativity
|
|
|
|
expectPattern(set, "[hitoshinamekatajamesanderson]", "aadehkmort");
|
|
|
|
expectPattern(set2, "[jackiemclean]", "aacceein");
|
|
|
|
set.addAll(set2);
|
|
|
|
expectPairs(set, "aacehort");
|
|
|
|
}
|
|
|
|
|
2000-01-12 18:04:21 +00:00
|
|
|
void
|
|
|
|
UnicodeSetTest::expectContainment(const UnicodeSet& set,
|
|
|
|
const UnicodeString& setName,
|
|
|
|
const UnicodeString& charsIn,
|
|
|
|
const UnicodeString& charsOut) {
|
|
|
|
UnicodeString bad;
|
|
|
|
int32_t i;
|
|
|
|
for (i=0; i<charsIn.length(); ++i) {
|
|
|
|
UChar c = charsIn.charAt(i);
|
|
|
|
if (!set.contains(c)) {
|
|
|
|
bad.append(c);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if (bad.length() > 0) {
|
|
|
|
logln((UnicodeString)"Fail: set " + setName + " does not contain " + bad +
|
|
|
|
", expected containment of " + charsIn);
|
|
|
|
} else {
|
|
|
|
logln((UnicodeString)"Ok: set " + setName + " contains " + charsIn);
|
|
|
|
}
|
|
|
|
|
|
|
|
bad.truncate(0);
|
|
|
|
for (i=0; i<charsOut.length(); ++i) {
|
|
|
|
UChar c = charsOut.charAt(i);
|
|
|
|
if (set.contains(c)) {
|
|
|
|
bad.append(c);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if (bad.length() > 0) {
|
|
|
|
logln((UnicodeString)"Fail: set " + setName + " contains " + bad +
|
|
|
|
", expected non-containment of " + charsOut);
|
|
|
|
} else {
|
|
|
|
logln((UnicodeString)"Ok: set " + setName + " does not contain " + charsOut);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
1999-10-26 17:16:13 +00:00
|
|
|
void
|
|
|
|
UnicodeSetTest::expectPattern(UnicodeSet& set,
|
|
|
|
const UnicodeString& pattern,
|
|
|
|
const UnicodeString& expectedPairs) {
|
|
|
|
UErrorCode status = U_ZERO_ERROR;
|
|
|
|
set.applyPattern(pattern, status);
|
1999-10-20 22:08:09 +00:00
|
|
|
if (U_FAILURE(status)) {
|
1999-10-26 17:16:13 +00:00
|
|
|
errln(UnicodeString("FAIL: applyPattern(\"") + pattern +
|
|
|
|
"\") failed");
|
1999-10-20 22:08:09 +00:00
|
|
|
return;
|
1999-10-26 17:16:13 +00:00
|
|
|
} else {
|
|
|
|
if (set.getPairs() != expectedPairs) {
|
|
|
|
errln(UnicodeString("FAIL: applyPattern(\"") + pattern +
|
|
|
|
"\") => pairs \"" +
|
|
|
|
escape(set.getPairs()) + "\", expected \"" +
|
|
|
|
escape(expectedPairs) + "\"");
|
|
|
|
} else {
|
|
|
|
logln(UnicodeString("Ok: applyPattern(\"") + pattern +
|
|
|
|
"\") => pairs \"" +
|
|
|
|
escape(set.getPairs()) + "\"");
|
|
|
|
}
|
|
|
|
}
|
1999-10-20 22:08:09 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
void
|
1999-10-26 17:16:13 +00:00
|
|
|
UnicodeSetTest::expectPairs(const UnicodeSet& set, const UnicodeString& expectedPairs) {
|
1999-10-20 22:08:09 +00:00
|
|
|
if (set.getPairs() != expectedPairs) {
|
|
|
|
errln(UnicodeString("FAIL: Expected pair list \"") +
|
|
|
|
escape(expectedPairs) + "\", got \"" +
|
1999-10-26 17:16:13 +00:00
|
|
|
escape(set.getPairs()) + "\"");
|
1999-10-20 22:08:09 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
1999-10-26 17:16:13 +00:00
|
|
|
// Converts a hex digit value to its character: values below 10 map to
// '0'..'9', and 10..15 map to 'A'..'F'. No range check is performed.
static UChar toHexString(int32_t i)
{
    if (i < 10) {
        return (UChar)(i + '0');
    }
    return (UChar)(i + ('A' - 10));
}
|
1999-10-20 22:08:09 +00:00
|
|
|
|
|
|
|
/**
 * Returns a copy of s in which every character outside the range
 * U+0020..U+007F is replaced by a backslash, the letter u, and the four
 * uppercase hex digits of the character's low 16 bits. Characters inside
 * that range are copied unchanged.
 *
 * @param s  the string to escape
 * @return   the escaped string
 */
UnicodeString UnicodeSetTest::escape(const UnicodeString& s)
{
    UnicodeString result;
    const int32_t len = s.length();
    for (int32_t pos = 0; pos < len; ++pos) {
        UChar ch = s[(UTextOffset)pos];
        if (ch < ' ' || ch > (UChar)0x7F) {
            result += '\\'; result += 'u';
            // Emit the four nibbles, most significant first.
            for (int32_t shift = 12; shift >= 0; shift -= 4) {
                result += toHexString((ch >> shift) & 0xF);
            }
        } else {
            result += ch;
        }
    }
    return result;
}
|