scuffed-code/icu4c/source/test/intltest/canittst.cpp

/********************************************************************
 * COPYRIGHT: 
 * Copyright (c) 2002-2006, International Business Machines Corporation and
 * others. All Rights Reserved.
 ********************************************************************
 *
 * @author Mark E. Davis
 * @author Vladimir Weinstein
 */

#include "unicode/utypes.h"

#if !UCONFIG_NO_NORMALIZATION

#include "intltest.h"
#include "cstring.h"
#include "canittst.h"
#include "unicode/caniter.h"
#include "unicode/normlzr.h"
#include "unicode/uchar.h"
#include "hash.h"

#define ARRAY_LENGTH(array) ((int32_t)(sizeof (array) / sizeof (*array)))

#define CASE(id,test) case id:                          \
                          name = #test;                 \
                          if (exec) {                   \
                              logln(#test "---");       \
                              logln((UnicodeString)""); \
                              test();                   \
                          }                             \
                          break

void CanonicalIteratorTest::runIndexedTest(int32_t index, UBool exec,
                                         const char* &name, char* /*par*/) {
    switch (index) {
        CASE(0, TestBasic);
        CASE(1, TestExhaustive);
        CASE(2, TestAPI);
      default: name = ""; break;
    }
}

/**
 * Convert Java-style strings with \u Unicode escapes into UnicodeString objects
static UnicodeString str(const char *input)
{
    UnicodeString str(input, ""); // Invariant conversion
    return str.unescape();
}
 */


CanonicalIteratorTest::CanonicalIteratorTest() :
nameTrans(NULL), hexTrans(NULL)
{
}

CanonicalIteratorTest::~CanonicalIteratorTest()
{
#if !UCONFIG_NO_TRANSLITERATION
  if(nameTrans != NULL) {
    delete(nameTrans);
  }
  if(hexTrans != NULL) {
    delete(hexTrans);
  }
#endif
}

void CanonicalIteratorTest::TestExhaustive() {
    UErrorCode status = U_ZERO_ERROR;
    CanonicalIterator it("", status);
    UChar32 i = 0;
    UnicodeString s;
    // Test static and dynamic class IDs
    if(it.getDynamicClassID() != CanonicalIterator::getStaticClassID()){
        errln("CanonicalIterator::getStaticClassId ! = CanonicalIterator.getDynamicClassID");
    }
    for (i = 0; i < 0x10FFFF; quick?i+=0x10:++i) {
        //for (i = 0xae00; i < 0xaf00; ++i) {
        
        if ((i % 0x100) == 0) {
            logln("Testing U+%06X", i);
        }
        
        // skip characters we know don't have decomps
        int8_t type = u_charType(i);
        if (type == U_UNASSIGNED || type == U_PRIVATE_USE_CHAR
            || type == U_SURROGATE) continue;
        
        s = i;
        characterTest(s, i, it);

        s += (UChar32)0x0345; //"\\u0345";
        characterTest(s, i, it);
    }
}

void CanonicalIteratorTest::TestBasic() {

    UErrorCode status = U_ZERO_ERROR;

    static const char * const testArray[][2] = {
        {"\\u00C5d\\u0307\\u0327", "A\\u030Ad\\u0307\\u0327, A\\u030Ad\\u0327\\u0307, A\\u030A\\u1E0B\\u0327, "
            "A\\u030A\\u1E11\\u0307, \\u00C5d\\u0307\\u0327, \\u00C5d\\u0327\\u0307, "
            "\\u00C5\\u1E0B\\u0327, \\u00C5\\u1E11\\u0307, \\u212Bd\\u0307\\u0327, "
            "\\u212Bd\\u0327\\u0307, \\u212B\\u1E0B\\u0327, \\u212B\\u1E11\\u0307"},
        {"\\u010d\\u017E", "c\\u030Cz\\u030C, c\\u030C\\u017E, \\u010Dz\\u030C, \\u010D\\u017E"},
        {"x\\u0307\\u0327", "x\\u0307\\u0327, x\\u0327\\u0307, \\u1E8B\\u0327"},
    };
    
#if 0
    // This is not interesting for C/C++ as the data is already built beforehand
    // check build
    UnicodeSet ss = CanonicalIterator.getSafeStart();
    logln("Safe Start: " + ss.toPattern(true));
    ss = CanonicalIterator.getStarts('a');
    expectEqual("Characters with 'a' at the start of their decomposition: ", "", CanonicalIterator.getStarts('a'),
        new UnicodeSet("[\u00E0-\u00E5\u0101\u0103\u0105\u01CE\u01DF\u01E1\u01FB"
        + "\u0201\u0203\u0227\u1E01\u1EA1\u1EA3\u1EA5\u1EA7\u1EA9\u1EAB\u1EAD\u1EAF\u1EB1\u1EB3\u1EB5\u1EB7]")
            );
#endif

    // check permute
    // NOTE: we use a TreeSet below to sort the output, which is not guaranteed to be sorted!

    Hashtable *permutations = new Hashtable(FALSE, status);
    permutations->setValueDeleter(uhash_deleteUnicodeString);
    UnicodeString toPermute("ABC");

    CanonicalIterator::permute(toPermute, FALSE, permutations, status);

    logln("testing permutation");
  
    expectEqual("Simple permutation ", "", collectionToString(permutations), "ABC, ACB, BAC, BCA, CAB, CBA");

    delete permutations;
    
    // try samples
    logln("testing samples");
    Hashtable *set = new Hashtable(FALSE, status);
    set->setValueDeleter(uhash_deleteUnicodeString);
    int32_t i = 0;
    CanonicalIterator it("", status);
    if(U_SUCCESS(status)) {
      for (i = 0; i < ARRAY_LENGTH(testArray); ++i) {
          //logln("Results for: " + name.transliterate(testArray[i]));
          UnicodeString testStr = CharsToUnicodeString(testArray[i][0]);
          it.setSource(testStr, status);
          set->removeAll();
          while (TRUE) {
              //UnicodeString *result = new UnicodeString(it.next());
              UnicodeString result(it.next());
              if (result.isBogus()) {
                  break;
              }
              set->put(result, new UnicodeString(result), status); // Add result to the table
              //logln(++counter + ": " + hex.transliterate(result));
              //logln(" = " + name.transliterate(result));
          }
          expectEqual(i + ": ", testStr, collectionToString(set), CharsToUnicodeString(testArray[i][1]));

      }
    } else {
      errln("Couldn't instantiate canonical iterator. Error: %s", u_errorName(status));
    }
    delete set;
}

void CanonicalIteratorTest::characterTest(UnicodeString &s, UChar32 ch, CanonicalIterator &it)
{
    UErrorCode status = U_ZERO_ERROR;
    UnicodeString decomp, comp;
    UBool gotDecomp = FALSE;
    UBool gotComp = FALSE;
    UBool gotSource = FALSE;

    Normalizer::decompose(s, FALSE, 0, decomp, status);
    Normalizer::compose(s, FALSE, 0, comp, status);
    
    // skip characters that don't have either decomp.
    // need quick test for this!
    if (s == decomp && s == comp) {
        return;
    }
    
    it.setSource(s, status);
    
    while (TRUE) {
        UnicodeString item = it.next();
        if (item.isBogus()) break;
        if (item == s) gotSource = TRUE;
        if (item == decomp) gotDecomp = TRUE;
        if (item == comp) gotComp = TRUE;
    }
    
    if (!gotSource || !gotDecomp || !gotComp) {
        errln("FAIL CanonicalIterator: " + s + (int)ch);
    }
}

void CanonicalIteratorTest::expectEqual(const UnicodeString &message, const UnicodeString &item, const UnicodeString &a, const UnicodeString &b) {
    if (!(a==b)) {
        errln("FAIL: " + message + getReadable(item));
        errln("\t" + getReadable(a));
        errln("\t" + getReadable(b));
    } else {
        logln("Checked: " + message + getReadable(item));
        logln("\t" + getReadable(a));
        logln("\t" + getReadable(b));
    }
}

UnicodeString CanonicalIteratorTest::getReadable(const UnicodeString &s) {
  UErrorCode status = U_ZERO_ERROR;
  UnicodeString result = "[";
    if (s.length() == 0) return "";
    // set up for readable display
#if !UCONFIG_NO_TRANSLITERATION
    if(verbose) {
      if (nameTrans == NULL)
          nameTrans = Transliterator::createInstance("[^\\ -\\u007F] name", UTRANS_FORWARD, status);
      UnicodeString sName = s;
      nameTrans->transliterate(sName);
      result += sName;
      result += ";";
    }
    if (hexTrans == NULL)
        hexTrans = Transliterator::createInstance("[^\\ -\\u007F] hex", UTRANS_FORWARD, status);
#endif
    UnicodeString sHex = s;
#if !UCONFIG_NO_TRANSLITERATION
    if(hexTrans) { // maybe there is no data and transliterator cannot be instantiated
      hexTrans->transliterate(sHex);
    }
#endif
    result += sHex;
    result += "]";
    return result;
    //return "[" + (verbose ? name->transliterate(s) + "; " : "") + hex->transliterate(s) + "]";
}

U_CFUNC int U_CALLCONV
compareUnicodeStrings(const void *s1, const void *s2) {
  UnicodeString **st1 = (UnicodeString **)s1;
  UnicodeString **st2 = (UnicodeString **)s2;

  return (*st1)->compare(**st2);
}


UnicodeString CanonicalIteratorTest::collectionToString(Hashtable *col) {
    UnicodeString result;

    // Iterate over the Hashtable, then qsort.

    UnicodeString **resArray = new UnicodeString*[col->count()];
    int32_t i = 0;

    const UHashElement *ne = NULL;
    int32_t el = -1;
    //Iterator it = basic.iterator();
    ne = col->nextElement(el);
    //while (it.hasNext()) 
    while (ne != NULL) {
      //String item = (String) it.next();
      UnicodeString *item = (UnicodeString *)(ne->value.pointer);
      resArray[i++] = item;
      ne = col->nextElement(el);
    }

    for(i = 0; i<col->count(); ++i) {
      logln(*resArray[i]);
    }

    qsort(resArray, col->count(), sizeof(UnicodeString *), compareUnicodeStrings);

    result = *resArray[0];

    for(i = 1; i<col->count(); ++i) {
      result += ", ";
      result += *resArray[i];
    }

/*
    Iterator it = col.iterator();
    while (it.hasNext()) {
        if (result.length() != 0) result.append(", ");
        result.append(it.next().toString());
    }
*/

    delete [] resArray;

    return result;
}

void CanonicalIteratorTest::TestAPI() {
  UErrorCode status = U_ZERO_ERROR;
  // Test reset and getSource
  UnicodeString start("ljubav");
  logln("Testing CanonicalIterator::getSource");
  logln("Instantiating canonical iterator with string "+start);
  CanonicalIterator can(start, status);
  UnicodeString source = can.getSource();
  logln("CanonicalIterator::getSource returned "+source);
  if(start != source) {
    errln("CanonicalIterator.getSource() didn't return the starting string. Expected "+start+", got "+source);
  }
  logln("Testing CanonicalIterator::reset");
  UnicodeString next = can.next();
  logln("CanonicalIterator::next returned "+next);

  can.reset();

  UnicodeString afterReset = can.next();
  logln("After reset, CanonicalIterator::next returned "+afterReset);

  if(next != afterReset) {
    errln("Next after instantiation ("+next+") is different from next after reset ("+afterReset+").");
  }
  
  logln("Testing getStaticClassID and getDynamicClassID");
  if(can.getDynamicClassID() != CanonicalIterator::getStaticClassID()){
      errln("RTTI failed for CanonicalIterator getDynamicClassID != getStaticClassID");
  }
}

#endif /* #if !UCONFIG_NO_NORMALIZATION */
ICU-1682 added a real test for canonical iterator X-SVN-Rev: 8110 2002-03-19 07:18:07 +00:00			`/********************************************************************`
			`* COPYRIGHT:`
ICU-5333 Whitespace changes. X-SVN-Rev: 20119 2006-08-20 05:08:35 +00:00			`* Copyright (c) 2002-2006, International Business Machines Corporation and`
ICU-1682 added a real test for canonical iterator X-SVN-Rev: 8110 2002-03-19 07:18:07 +00:00			`* others. All Rights Reserved.`
			`********************************************************************`
			`*`
			`* @author Mark E. Davis`
			`* @author Vladimir Weinstein`
			`*/`

ICU-2860 add UCONFIG_NO_NORMALIZATION and UCONFIG_NO_IDNA X-SVN-Rev: 11808 2003-05-06 01:22:23 +00:00			`#include "unicode/utypes.h"`

			`#if !UCONFIG_NO_NORMALIZATION`
ICU-1682 added a real test for canonical iterator X-SVN-Rev: 8110 2002-03-19 07:18:07 +00:00
ICU-1682 Fix for AIX, remove tabs, remove CVS tags. X-SVN-Rev: 8166 2002-03-20 23:47:53 +00:00			`#include "intltest.h"`
ICU-1682 added a real test for canonical iterator X-SVN-Rev: 8110 2002-03-19 07:18:07 +00:00			`#include "cstring.h"`
			`#include "canittst.h"`
ICU-2209 make canonical iterator public X-SVN-Rev: 9866 2002-09-17 05:06:04 +00:00			`#include "unicode/caniter.h"`
ICU-3326 Don't include some unneeded headers. X-SVN-Rev: 13965 2003-12-03 06:58:28 +00:00			`#include "unicode/normlzr.h"`
ICU-2085 Don't use deprecated or unused includes X-SVN-Rev: 9761 2002-08-21 21:33:16 +00:00			`#include "unicode/uchar.h"`
ICU-3326 Don't include some unneeded headers. X-SVN-Rev: 13965 2003-12-03 06:58:28 +00:00			`#include "hash.h"`
ICU-1682 added a real test for canonical iterator X-SVN-Rev: 8110 2002-03-19 07:18:07 +00:00
			`#define ARRAY_LENGTH(array) ((int32_t)(sizeof (array) / sizeof (*array)))`

			`#define CASE(id,test) case id: \`
			`name = #test; \`
			`if (exec) { \`
			`logln(#test "---"); \`
			`logln((UnicodeString)""); \`
			`test(); \`
			`} \`
			`break`

			`void CanonicalIteratorTest::runIndexedTest(int32_t index, UBool exec,`
			`const char* &name, char* /par/) {`
			`switch (index) {`
			`CASE(0, TestBasic);`
			`CASE(1, TestExhaustive);`
ICU-2039 increase code coverage for canonical iterator X-SVN-Rev: 9471 2002-07-31 20:41:40 +00:00			`CASE(2, TestAPI);`
ICU-1682 added a real test for canonical iterator X-SVN-Rev: 8110 2002-03-19 07:18:07 +00:00			`default: name = ""; break;`
			`}`
			`}`

			`/**`
			`* Convert Java-style strings with \u Unicode escapes into UnicodeString objects`
			`static UnicodeString str(const char *input)`
			`{`
			`UnicodeString str(input, ""); // Invariant conversion`
			`return str.unescape();`
			`}`
ICU-900 Fixed some compiler warnings. X-SVN-Rev: 8379 2002-04-04 20:06:49 +00:00			`*/`
ICU-1682 added a real test for canonical iterator X-SVN-Rev: 8110 2002-03-19 07:18:07 +00:00

			`CanonicalIteratorTest::CanonicalIteratorTest() :`
ICU-900 Fixed some compiler warnings. X-SVN-Rev: 8304 2002-03-29 19:56:29 +00:00			`nameTrans(NULL), hexTrans(NULL)`
ICU-1682 added a real test for canonical iterator X-SVN-Rev: 8110 2002-03-19 07:18:07 +00:00			`{`
			`}`

			`CanonicalIteratorTest::~CanonicalIteratorTest()`
			`{`
ICU-2248 modularize ICU X-SVN-Rev: 9910 2002-09-21 00:43:14 +00:00			`#if !UCONFIG_NO_TRANSLITERATION`
ICU-900 Fixed some compiler warnings. X-SVN-Rev: 8304 2002-03-29 19:56:29 +00:00			`if(nameTrans != NULL) {`
			`delete(nameTrans);`
ICU-1682 added a real test for canonical iterator X-SVN-Rev: 8110 2002-03-19 07:18:07 +00:00			`}`
ICU-900 Fixed some compiler warnings. X-SVN-Rev: 8304 2002-03-29 19:56:29 +00:00			`if(hexTrans != NULL) {`
			`delete(hexTrans);`
ICU-1682 added a real test for canonical iterator X-SVN-Rev: 8110 2002-03-19 07:18:07 +00:00			`}`
ICU-2248 modularize ICU X-SVN-Rev: 9910 2002-09-21 00:43:14 +00:00			`#endif`
ICU-1682 added a real test for canonical iterator X-SVN-Rev: 8110 2002-03-19 07:18:07 +00:00			`}`

			`void CanonicalIteratorTest::TestExhaustive() {`
ICU-1682 Fix for AIX, remove tabs, remove CVS tags. X-SVN-Rev: 8166 2002-03-20 23:47:53 +00:00			`UErrorCode status = U_ZERO_ERROR;`
ICU-1682 added a real test for canonical iterator X-SVN-Rev: 8110 2002-03-19 07:18:07 +00:00			`CanonicalIterator it("", status);`
			`UChar32 i = 0;`
ICU-4465 Change TestExhaustive to try the character with and without u+0345. X-SVN-Rev: 17442 2005-04-01 01:14:25 +00:00			`UnicodeString s;`
ICU-4161 remove tabs from source code X-SVN-Rev: 16829 2004-11-11 23:34:58 +00:00			`// Test static and dynamic class IDs`
ICU-2118 improve API coverage X-SVN-Rev: 10393 2002-11-27 02:11:42 +00:00			`if(it.getDynamicClassID() != CanonicalIterator::getStaticClassID()){`
ICU-4161 remove tabs from source code X-SVN-Rev: 16829 2004-11-11 23:34:58 +00:00			`errln("CanonicalIterator::getStaticClassId ! = CanonicalIterator.getDynamicClassID");`
			`}`
ICU-1682 faster exhaustive test for debug runs X-SVN-Rev: 8147 2002-03-20 05:14:00 +00:00			`for (i = 0; i < 0x10FFFF; quick?i+=0x10:++i) {`
ICU-1682 Fix for AIX, remove tabs, remove CVS tags. X-SVN-Rev: 8166 2002-03-20 23:47:53 +00:00			`//for (i = 0xae00; i < 0xaf00; ++i) {`

			`if ((i % 0x100) == 0) {`
			`logln("Testing U+%06X", i);`
			`}`

			`// skip characters we know don't have decomps`
			`int8_t type = u_charType(i);`
			`if (type == U_UNASSIGNED \|\| type == U_PRIVATE_USE_CHAR`
			`\|\| type == U_SURROGATE) continue;`

			`s = i;`
ICU-5333 Whitespace changes. X-SVN-Rev: 20119 2006-08-20 05:08:35 +00:00			`characterTest(s, i, it);`
ICU-4465 Change TestExhaustive to try the character with and without u+0345. X-SVN-Rev: 17442 2005-04-01 01:14:25 +00:00
ICU-1682 added a real test for canonical iterator X-SVN-Rev: 8110 2002-03-19 07:18:07 +00:00			`s += (UChar32)0x0345; //"\\u0345";`
ICU-5333 Whitespace changes. X-SVN-Rev: 20119 2006-08-20 05:08:35 +00:00			`characterTest(s, i, it);`
ICU-1682 added a real test for canonical iterator X-SVN-Rev: 8110 2002-03-19 07:18:07 +00:00			`}`
			`}`

			`void CanonicalIteratorTest::TestBasic() {`

ICU-1682 Fix for AIX, remove tabs, remove CVS tags. X-SVN-Rev: 8176 2002-03-21 17:59:20 +00:00			`UErrorCode status = U_ZERO_ERROR;`
ICU-1682 added a real test for canonical iterator X-SVN-Rev: 8110 2002-03-19 07:18:07 +00:00
ICU-1682 Fix for AIX, remove tabs, remove CVS tags. X-SVN-Rev: 8176 2002-03-21 17:59:20 +00:00			`static const char * const testArray[][2] = {`
			`{"\\u00C5d\\u0307\\u0327", "A\\u030Ad\\u0307\\u0327, A\\u030Ad\\u0327\\u0307, A\\u030A\\u1E0B\\u0327, "`
ICU-1682 Fix for AIX, remove tabs, remove CVS tags. X-SVN-Rev: 8166 2002-03-20 23:47:53 +00:00			`"A\\u030A\\u1E11\\u0307, \\u00C5d\\u0307\\u0327, \\u00C5d\\u0327\\u0307, "`
			`"\\u00C5\\u1E0B\\u0327, \\u00C5\\u1E11\\u0307, \\u212Bd\\u0307\\u0327, "`
ICU-1682 Fix for AIX, remove tabs, remove CVS tags. X-SVN-Rev: 8176 2002-03-21 17:59:20 +00:00			`"\\u212Bd\\u0327\\u0307, \\u212B\\u1E0B\\u0327, \\u212B\\u1E11\\u0307"},`
			`{"\\u010d\\u017E", "c\\u030Cz\\u030C, c\\u030C\\u017E, \\u010Dz\\u030C, \\u010D\\u017E"},`
			`{"x\\u0307\\u0327", "x\\u0307\\u0327, x\\u0327\\u0307, \\u1E8B\\u0327"},`
ICU-1682 added a real test for canonical iterator X-SVN-Rev: 8110 2002-03-19 07:18:07 +00:00			`};`

			`#if 0`
			`// This is not interesting for C/C++ as the data is already built beforehand`
			`// check build`
			`UnicodeSet ss = CanonicalIterator.getSafeStart();`
			`logln("Safe Start: " + ss.toPattern(true));`
			`ss = CanonicalIterator.getStarts('a');`
			`expectEqual("Characters with 'a' at the start of their decomposition: ", "", CanonicalIterator.getStarts('a'),`
			`new UnicodeSet("[\u00E0-\u00E5\u0101\u0103\u0105\u01CE\u01DF\u01E1\u01FB"`
			`+ "\u0201\u0203\u0227\u1E01\u1EA1\u1EA3\u1EA5\u1EA7\u1EA9\u1EAB\u1EAD\u1EAF\u1EB1\u1EB3\u1EB5\u1EB7]")`
ICU-1682 Fix for AIX, remove tabs, remove CVS tags. X-SVN-Rev: 8166 2002-03-20 23:47:53 +00:00			`);`
ICU-1682 added a real test for canonical iterator X-SVN-Rev: 8110 2002-03-19 07:18:07 +00:00			`#endif`
ICU-1682 faster exhaustive test for debug runs X-SVN-Rev: 8147 2002-03-20 05:14:00 +00:00
ICU-1682 added a real test for canonical iterator X-SVN-Rev: 8110 2002-03-19 07:18:07 +00:00			`// check permute`
			`// NOTE: we use a TreeSet below to sort the output, which is not guaranteed to be sorted!`

			`Hashtable *permutations = new Hashtable(FALSE, status);`
			`permutations->setValueDeleter(uhash_deleteUnicodeString);`
ICU-1682 fixed 'permute' invokation to satisfy pedantic gcc X-SVN-Rev: 8112 2002-03-19 07:52:44 +00:00			`UnicodeString toPermute("ABC");`
ICU-1682 added a real test for canonical iterator X-SVN-Rev: 8110 2002-03-19 07:18:07 +00:00
ICU-1682 fixed 'permute' invokation to satisfy pedantic gcc X-SVN-Rev: 8112 2002-03-19 07:52:44 +00:00			`CanonicalIterator::permute(toPermute, FALSE, permutations, status);`
ICU-1682 added a real test for canonical iterator X-SVN-Rev: 8110 2002-03-19 07:18:07 +00:00
			`logln("testing permutation");`

			`expectEqual("Simple permutation ", "", collectionToString(permutations), "ABC, ACB, BAC, BCA, CAB, CBA");`

			`delete permutations;`

			`// try samples`
			`logln("testing samples");`
			`Hashtable *set = new Hashtable(FALSE, status);`
			`set->setValueDeleter(uhash_deleteUnicodeString);`
			`int32_t i = 0;`
			`CanonicalIterator it("", status);`
ICU-2840 tests shouldn't crash if there is no data X-SVN-Rev: 12340 2003-06-06 04:54:34 +00:00			`if(U_SUCCESS(status)) {`
			`for (i = 0; i < ARRAY_LENGTH(testArray); ++i) {`
			`//logln("Results for: " + name.transliterate(testArray[i]));`
			`UnicodeString testStr = CharsToUnicodeString(testArray[i][0]);`
			`it.setSource(testStr, status);`
			`set->removeAll();`
			`while (TRUE) {`
			`//UnicodeString *result = new UnicodeString(it.next());`
			`UnicodeString result(it.next());`
			`if (result.isBogus()) {`
			`break;`
			`}`
			`set->put(result, new UnicodeString(result), status); // Add result to the table`
			`//logln(++counter + ": " + hex.transliterate(result));`
			`//logln(" = " + name.transliterate(result));`
			`}`
			`expectEqual(i + ": ", testStr, collectionToString(set), CharsToUnicodeString(testArray[i][1]));`

			`}`
			`} else {`
			`errln("Couldn't instantiate canonical iterator. Error: %s", u_errorName(status));`
ICU-1682 added a real test for canonical iterator X-SVN-Rev: 8110 2002-03-19 07:18:07 +00:00			`}`
			`delete set;`
			`}`

ICU-4465 Change TestExhaustive to try the character with and without u+0345. X-SVN-Rev: 17442 2005-04-01 01:14:25 +00:00			`void CanonicalIteratorTest::characterTest(UnicodeString &s, UChar32 ch, CanonicalIterator &it)`
			`{`
			`UErrorCode status = U_ZERO_ERROR;`
			`UnicodeString decomp, comp;`
			`UBool gotDecomp = FALSE;`
			`UBool gotComp = FALSE;`
			`UBool gotSource = FALSE;`

ICU-5333 Whitespace changes. X-SVN-Rev: 20119 2006-08-20 05:08:35 +00:00			`Normalizer::decompose(s, FALSE, 0, decomp, status);`
ICU-4465 Change TestExhaustive to try the character with and without u+0345. X-SVN-Rev: 17442 2005-04-01 01:14:25 +00:00			`Normalizer::compose(s, FALSE, 0, comp, status);`

			`// skip characters that don't have either decomp.`
			`// need quick test for this!`
			`if (s == decomp && s == comp) {`
			`return;`
			`}`

			`it.setSource(s, status);`

			`while (TRUE) {`
			`UnicodeString item = it.next();`
			`if (item.isBogus()) break;`
			`if (item == s) gotSource = TRUE;`
			`if (item == decomp) gotDecomp = TRUE;`
			`if (item == comp) gotComp = TRUE;`
			`}`

			`if (!gotSource \|\| !gotDecomp \|\| !gotComp) {`
			`errln("FAIL CanonicalIterator: " + s + (int)ch);`
			`}`
			`}`

ICU-1682 added a real test for canonical iterator X-SVN-Rev: 8110 2002-03-19 07:18:07 +00:00			`void CanonicalIteratorTest::expectEqual(const UnicodeString &message, const UnicodeString &item, const UnicodeString &a, const UnicodeString &b) {`
			`if (!(a==b)) {`
ICU-1682 Fix for AIX, remove tabs, remove CVS tags. X-SVN-Rev: 8166 2002-03-20 23:47:53 +00:00			`errln("FAIL: " + message + getReadable(item));`
			`errln("\t" + getReadable(a));`
			`errln("\t" + getReadable(b));`
ICU-1682 added a real test for canonical iterator X-SVN-Rev: 8110 2002-03-19 07:18:07 +00:00			`} else {`
ICU-1682 Fix for AIX, remove tabs, remove CVS tags. X-SVN-Rev: 8166 2002-03-20 23:47:53 +00:00			`logln("Checked: " + message + getReadable(item));`
			`logln("\t" + getReadable(a));`
			`logln("\t" + getReadable(b));`
ICU-1682 added a real test for canonical iterator X-SVN-Rev: 8110 2002-03-19 07:18:07 +00:00			`}`
			`}`

			`UnicodeString CanonicalIteratorTest::getReadable(const UnicodeString &s) {`
			`UErrorCode status = U_ZERO_ERROR;`
			`UnicodeString result = "[";`
			`if (s.length() == 0) return "";`
			`// set up for readable display`
ICU-2248 modularize ICU X-SVN-Rev: 9910 2002-09-21 00:43:14 +00:00			`#if !UCONFIG_NO_TRANSLITERATION`
ICU-1682 added a real test for canonical iterator X-SVN-Rev: 8110 2002-03-19 07:18:07 +00:00			`if(verbose) {`
ICU-900 Fixed some compiler warnings. X-SVN-Rev: 8304 2002-03-29 19:56:29 +00:00			`if (nameTrans == NULL)`
			`nameTrans = Transliterator::createInstance("[^\\ -\\u007F] name", UTRANS_FORWARD, status);`
ICU-1682 added a real test for canonical iterator X-SVN-Rev: 8110 2002-03-19 07:18:07 +00:00			`UnicodeString sName = s;`
ICU-900 Fixed some compiler warnings. X-SVN-Rev: 8304 2002-03-29 19:56:29 +00:00			`nameTrans->transliterate(sName);`
ICU-1682 added a real test for canonical iterator X-SVN-Rev: 8110 2002-03-19 07:18:07 +00:00			`result += sName;`
			`result += ";";`
			`}`
ICU-900 Fixed some compiler warnings. X-SVN-Rev: 8304 2002-03-29 19:56:29 +00:00			`if (hexTrans == NULL)`
			`hexTrans = Transliterator::createInstance("[^\\ -\\u007F] hex", UTRANS_FORWARD, status);`
ICU-2248 modularize ICU X-SVN-Rev: 9910 2002-09-21 00:43:14 +00:00			`#endif`
ICU-1682 added a real test for canonical iterator X-SVN-Rev: 8110 2002-03-19 07:18:07 +00:00			`UnicodeString sHex = s;`
ICU-2248 modularize ICU X-SVN-Rev: 9910 2002-09-21 00:43:14 +00:00			`#if !UCONFIG_NO_TRANSLITERATION`
ICU-2840 tests shouldn't crash if there is no data X-SVN-Rev: 12340 2003-06-06 04:54:34 +00:00			`if(hexTrans) { // maybe there is no data and transliterator cannot be instantiated`
			`hexTrans->transliterate(sHex);`
			`}`
ICU-2248 modularize ICU X-SVN-Rev: 9910 2002-09-21 00:43:14 +00:00			`#endif`
ICU-1682 added a real test for canonical iterator X-SVN-Rev: 8110 2002-03-19 07:18:07 +00:00			`result += sHex;`
			`result += "]";`
			`return result;`
			`//return "[" + (verbose ? name->transliterate(s) + "; " : "") + hex->transliterate(s) + "]";`
			`}`

ICU-3946 Fix some tests to use U_EXPORT2 and U_CALLCONV more often X-SVN-Rev: 16021 2004-07-16 15:44:52 +00:00			`U_CFUNC int U_CALLCONV`
			`compareUnicodeStrings(const void s1, const void s2) {`
ICU-1682 added a real test for canonical iterator X-SVN-Rev: 8110 2002-03-19 07:18:07 +00:00			`UnicodeString st1 = (UnicodeString )s1;`
			`UnicodeString st2 = (UnicodeString )s2;`

			`return (st1)->compare(*st2);`
			`}`


			`UnicodeString CanonicalIteratorTest::collectionToString(Hashtable *col) {`
			`UnicodeString result;`

			`// Iterate over the Hashtable, then qsort.`

			`UnicodeString *resArray = new UnicodeString[col->count()];`
			`int32_t i = 0;`

			`const UHashElement *ne = NULL;`
			`int32_t el = -1;`
			`//Iterator it = basic.iterator();`
			`ne = col->nextElement(el);`
			`//while (it.hasNext())`
			`while (ne != NULL) {`
			`//String item = (String) it.next();`
			`UnicodeString item = (UnicodeString )(ne->value.pointer);`
			`resArray[i++] = item;`
			`ne = col->nextElement(el);`
			`}`

			`for(i = 0; i<col->count(); ++i) {`
			`logln(*resArray[i]);`
			`}`

			`qsort(resArray, col->count(), sizeof(UnicodeString *), compareUnicodeStrings);`

			`result = *resArray[0];`

			`for(i = 1; i<col->count(); ++i) {`
			`result += ", ";`
			`result += *resArray[i];`
			`}`

			`/*`
			`Iterator it = col.iterator();`
			`while (it.hasNext()) {`
			`if (result.length() != 0) result.append(", ");`
			`result.append(it.next().toString());`
			`}`
			`*/`

ICU-1682 (weiv) fixed a leak in canonical iterator test X-SVN-Rev: 8182 2002-03-21 19:38:00 +00:00			`delete [] resArray;`
ICU-1682 added a real test for canonical iterator X-SVN-Rev: 8110 2002-03-19 07:18:07 +00:00
			`return result;`
			`}`

ICU-2039 increase code coverage for canonical iterator X-SVN-Rev: 9471 2002-07-31 20:41:40 +00:00			`void CanonicalIteratorTest::TestAPI() {`
			`UErrorCode status = U_ZERO_ERROR;`
			`// Test reset and getSource`
			`UnicodeString start("ljubav");`
			`logln("Testing CanonicalIterator::getSource");`
			`logln("Instantiating canonical iterator with string "+start);`
			`CanonicalIterator can(start, status);`
			`UnicodeString source = can.getSource();`
			`logln("CanonicalIterator::getSource returned "+source);`
			`if(start != source) {`
			`errln("CanonicalIterator.getSource() didn't return the starting string. Expected "+start+", got "+source);`
			`}`
			`logln("Testing CanonicalIterator::reset");`
			`UnicodeString next = can.next();`
			`logln("CanonicalIterator::next returned "+next);`

			`can.reset();`

			`UnicodeString afterReset = can.next();`
			`logln("After reset, CanonicalIterator::next returned "+afterReset);`

			`if(next != afterReset) {`
			`errln("Next after instantiation ("+next+") is different from next after reset ("+afterReset+").");`
			`}`
ICU-2118 improve API coverage X-SVN-Rev: 10394 2002-11-27 02:40:34 +00:00
			`logln("Testing getStaticClassID and getDynamicClassID");`
			`if(can.getDynamicClassID() != CanonicalIterator::getStaticClassID()){`
			`errln("RTTI failed for CanonicalIterator getDynamicClassID != getStaticClassID");`
			`}`
ICU-2039 Add a newline at the end of the file. X-SVN-Rev: 9502 2002-08-01 02:03:12 +00:00			`}`

ICU-2860 add UCONFIG_NO_NORMALIZATION and UCONFIG_NO_IDNA X-SVN-Rev: 11808 2003-05-06 01:22:23 +00:00			`#endif /* #if !UCONFIG_NO_NORMALIZATION */`