scuffed-code/icu4c/source/i18n/tblcoll.cpp

/*
******************************************************************************
* Copyright <EFBFBD> {1996-2001}, International Business Machines Corporation and   *
* others. All Rights Reserved.                                               *     
******************************************************************************
*/

/**
* File tblcoll.cpp
*
* Created by: Helena Shih 
*
* Modification History:
*
*  Date        Name        Description
*  2/5/97      aliu        Added streamIn and streamOut methods.  Added
*                          constructor which reads RuleBasedCollator object from
*                          a binary file.  Added writeToFile method which streams
*                          RuleBasedCollator out to a binary file.  The streamIn
*                          and streamOut methods use istream and ostream objects
*                          in binary mode.
*  2/11/97     aliu        Moved declarations out of for loop initializer.
*                          Added Mac compatibility #ifdef for ios::nocreate.
*  2/12/97     aliu        Modified to use TableCollationData sub-object to
*                          hold invariant data.
*  2/13/97     aliu        Moved several methods into this class from Collation.
*                          Added a private RuleBasedCollator(Locale&) constructor,
*                          to be used by Collator::getInstance().  General
*                          clean up.  Made use of UErrorCode variables consistent.
*  2/20/97     helena      Added clone, operator==, operator!=, operator=, and copy
*                          constructor and getDynamicClassID.
*  3/5/97      aliu        Changed compaction cycle to improve performance.  We
*                          use the maximum allowable value which is kBlockCount.
*                          Modified getRules() to load rules dynamically.  Changed
*                          constructFromFile() call to accomodate this (added
*                          parameter to specify whether binary loading is to
*                          take place).
* 05/06/97     helena      Added memory allocation error check.
*  6/20/97     helena      Java class name change.
*  6/23/97     helena      Adding comments to make code more readable.
* 09/03/97     helena      Added createCollationKeyValues().
* 06/26/98     erm         Changes for CollationKeys using byte arrays.
* 08/10/98     erm         Synched with 1.2 version of RuleBasedCollator.java
* 04/23/99     stephen     Removed EDecompositionMode, merged with
*                          Normalizer::EMode
* 06/14/99     stephen     Removed kResourceBundleSuffix
* 06/22/99     stephen     Fixed logic in constructFromFile() since .ctx
*                          files are no longer used.
* 11/02/99     helena      Collator performance enhancements.  Special case
*                          for NO_OP situations. 
* 11/17/99     srl         More performance enhancements. Inlined some internal functions.
* 12/15/99     aliu        Update to support Thai collation.  Move NormalizerIterator
*                          to implementation file.
* 01/29/01     synwee      Modified into a C++ wrapper calling C APIs (ucol.h)
*/

#include "ucolimp.h"
#include "unicode/tblcoll.h"
#include "unicode/coleitr.h"
#include "uhash.h"
#include "unicode/resbund.h"

#ifdef _DEBUG
  #include "unistrm.h"
#endif

/* forward declarations ----------------------------------------------------- */

UChar forwardCharIteratorGlue(void *iterator);

/* global variable ---------------------------------------------------------- */

/*
synwee : using another name for this
const uint32_t tblcoll_StackBufferLen = 1024;
*/
const uint32_t StackBufferLen = 1024;

/* RuleBasedCollator declaration ----------------------------------------- */

/* ---------------------------------------------------------------------------
The following diagram shows the data structure of the RuleBasedCollator  object. 
Suppose we have the rule, where 'o-umlaut' is the unicode char 0x00F6. 
"a, A < b, B < c, C, ch, cH, Ch, CH < d, D ... < o, O; 
'o-umlaut'/E, 'O-umlaut'/E ...".
What the rule says is, sorts 'ch'ligatures and 'c' only with tertiary 
difference and sorts 'o-umlaut' as if it's always expanded with 'e'.

mapping table                 contracting list             expanding list
(contains all unicode 
char entries)               ___    ____________      _________________________
 ________                |=>|_*_|->|'c' |v('c') | |=>|v('o')|v('umlaut')|v('e')|
|_\u0001_|-> v('\u0001') |  |_:_|  |------------| |  |-------------------------|
|_\u0002_|-> v('\u0002') |  |_:_|  |'ch'|v('ch')| |  |             :           |
|____:___|               |  |_:_|  |------------| |  |-------------------------|
|____:___|               |         |'cH'|v('cH')| |  |             :           |
|__'a'___|-> v('a')      |         |------------| |  |-------------------------|
|__'b'___|-> v('b')      |         |'Ch'|v('Ch')| |  |             :           |
|____:___|               |         |------------| |  |-------------------------|
|____:___|               |         |'CH'|v('CH')| |  |             :           |
|___'c'__|----------------          ------------  |  |-------------------------|
|____:___|                                        |  |             :           |
|o-umlaut|----------------------------------------   |_________________________|
|____:___|

--------------------------------------------------------------------------- */

/* public RuleBasedCollator constructor ---------------------------------- */

/**
* Copy constructor
*/
RuleBasedCollator::RuleBasedCollator(const RuleBasedCollator& that) : 
              Collator(that), dataIsOwned(FALSE), ucollator(that.ucollator),
              urulestring(that.urulestring)
{
}

RuleBasedCollator::RuleBasedCollator(const UnicodeString& rules,
                                           UErrorCode& status) : 
                                           dataIsOwned(FALSE) 
{
  if (U_FAILURE(status))
    return;
 
  int32_t length = rules.length();

	UChar ucharrules[StackBufferLen];
	UChar *pucharrules = ucharrules;
	
  if (length >= StackBufferLen)
		pucharrules = new UChar[length + 1];
	
	rules.extract(0, length, pucharrules);
  pucharrules[length] = 0;

  ucollator = ucol_openRules(pucharrules, length, UCOL_DEFAULT_NORMALIZATION, 
                             UCOL_DEFAULT_STRENGTH, &status);
  
  if (U_SUCCESS(status))
  {
    const UChar *r = ucol_getRules(ucollator, &length);
    urulestring = new UnicodeString(r, length);
    
    dataIsOwned = TRUE;
  }
  
	if (pucharrules != ucharrules)
		delete[] pucharrules;
}

RuleBasedCollator::RuleBasedCollator(const UnicodeString& rules,
                      ECollationStrength collationStrength,
                      UErrorCode& status) : dataIsOwned(FALSE)
{
  if (U_FAILURE(status))
    return;
 
  int32_t length = rules.length();

	UChar ucharrules[StackBufferLen];
	UChar *pucharrules = ucharrules;
	
  if (length >= StackBufferLen)
		pucharrules = new UChar[length + 1];
	
	rules.extract(0, length, pucharrules);
  pucharrules[length] = 0;

  UCollationStrength strength = getUCollationStrength(collationStrength);
  ucollator = ucol_openRules(pucharrules, length, UCOL_DEFAULT_NORMALIZATION, 
                             strength, &status);

  if (U_SUCCESS(status))
  {
    const UChar *r = ucol_getRules(ucollator, &length);
    urulestring = new UnicodeString(r, length);
    dataIsOwned = TRUE;
  }
  
	if (pucharrules != ucharrules)
		delete[] pucharrules;
}

RuleBasedCollator::RuleBasedCollator(const UnicodeString& rules,
                                     Normalizer::EMode decompositionMode,
                                     UErrorCode& status) : 
                                     dataIsOwned(FALSE)
{
  if (U_FAILURE(status))
    return;
 
  int32_t length = rules.length();

	UChar ucharrules[StackBufferLen];
	UChar *pucharrules = ucharrules;
	
  if (length >= StackBufferLen)
		pucharrules = new UChar[length + 1];
	
	rules.extract(0, length, pucharrules);
  pucharrules[length] = 0;

  UNormalizationMode mode = Normalizer::getUNormalizationMode(
                                                   decompositionMode, status);
  ucollator = ucol_openRules(pucharrules, length, mode, 
                             UCOL_DEFAULT_STRENGTH, &status);

  if (U_SUCCESS(status))
  {
    const UChar *r = ucol_getRules(ucollator, &length);
    urulestring = new UnicodeString(r, length);
    dataIsOwned = TRUE;
  }
  
	if (pucharrules != ucharrules)
		delete[] pucharrules;
}

RuleBasedCollator::RuleBasedCollator(const UnicodeString& rules,
                      ECollationStrength collationStrength,
                      Normalizer::EMode decompositionMode,
                      UErrorCode& status) : dataIsOwned(FALSE)
{
  if (U_FAILURE(status))
    return;

  int32_t length = rules.length();

	UChar ucharrules[StackBufferLen];
	UChar *pucharrules = ucharrules;
	
  if (length >= StackBufferLen)
		pucharrules = new UChar[length + 1];
	
	rules.extract(0, length, pucharrules);
  pucharrules[length] = 0;

  UCollationStrength strength = getUCollationStrength(collationStrength);
  UNormalizationMode mode = Normalizer::getUNormalizationMode(
                                                   decompositionMode, status);
  ucollator = ucol_openRules(pucharrules, length, mode, strength, &status);
  if (U_SUCCESS(status))
  {
    const UChar *r = ucol_getRules(ucollator, &length);
    urulestring = new UnicodeString(r, length);
    dataIsOwned = TRUE;
  }

	if (pucharrules != ucharrules)
		delete[] pucharrules;
}


/* RuleBasedCollator public destructor ----------------------------------- */

RuleBasedCollator::~RuleBasedCollator()
{
  if (dataIsOwned)
  {
    ucol_close(ucollator);
    delete urulestring;
  }
  ucollator = NULL;
}

/* RuleBaseCollator public methods --------------------------------------- */

UBool RuleBasedCollator::operator==(const Collator& that) const
{
  /* only checks for address equals here */
  if (Collator::operator==(that))
    return TRUE;
    
  if (getDynamicClassID() != that.getDynamicClassID())
    return FALSE;  /* not the same class */
       
  RuleBasedCollator& thatAlias = (RuleBasedCollator&)that;

  /*
  synwee : orginal code does not check for data compatibility
  */
  if (ucollator != thatAlias.ucollator)
    return FALSE;
    
  return TRUE;
}

RuleBasedCollator& RuleBasedCollator::operator=(
                                              const RuleBasedCollator& that)
{
  if (this != &that)
  {
    if (dataIsOwned)
    {
      ucol_close(ucollator);
      ucollator = NULL;
      delete urulestring;
    }
    
    dataIsOwned = FALSE;
    ucollator = that.ucollator;
    urulestring = that.urulestring;
  }
  return *this;
}

Collator* RuleBasedCollator::clone() const
{
  return new RuleBasedCollator(*this);
}

/** 
* Create a CollationElementIterator object that will iterator over the 
* elements in a string, using the collation rules defined in this 
* RuleBasedCollator
*/
CollationElementIterator* RuleBasedCollator::createCollationElementIterator
                                           (const UnicodeString& source) const
{
  UErrorCode status = U_ZERO_ERROR;
  CollationElementIterator *result = new CollationElementIterator(source, this, 
                                                                  status);
  
  if (U_FAILURE(status))
    return NULL;
    
  return result;
}

/** 
* Create a CollationElementIterator object that will iterator over the 
* elements in a string, using the collation rules defined in this 
* RuleBasedCollator
*/
CollationElementIterator* RuleBasedCollator::createCollationElementIterator
                                       (const CharacterIterator& source) const
{
  UErrorCode status = U_ZERO_ERROR;
  CollationElementIterator *result = new CollationElementIterator(source, this, 
                                                                  status);
  
  if (U_FAILURE(status))
    return NULL;
    
  return result;
}

/** 
* Return a string representation of this collator's rules. The string can 
* later be passed to the constructor that takes a UnicodeString argument, 
* which will construct a collator that's functionally identical to this one. 
* You can also allow users to edit the string in order to change the collation 
* data, or you can print it out for inspection, or whatever.
*/
const UnicodeString& RuleBasedCollator::getRules() const
{
  return (*urulestring);
}

Collator::EComparisonResult RuleBasedCollator::compare(
                                               const UnicodeString& source,
                                               const UnicodeString& target,
                                               int32_t length) const
{
  UnicodeString source_togo;
  UnicodeString target_togo;
  UTextOffset begin=0;

  source.extract(begin, uprv_min(length,source.length()), source_togo);
  target.extract(begin, uprv_min(length,target.length()), target_togo);
  return compare(source_togo, target_togo);
}

Collator::EComparisonResult RuleBasedCollator::compare(const UChar* source, 
                                                       int32_t sourceLength,
                                                       const UChar* target,
                                                       int32_t targetLength) 
                                                       const
{
  return getEComparisonResult(ucol_strcoll(ucollator, source, sourceLength, 
                                                     target, targetLength));
}

/**
* Compare two strings using this collator
*/
Collator::EComparisonResult RuleBasedCollator::compare(
                                             const UnicodeString& source,
                                             const UnicodeString& target) const
{
  UChar uSstart[StackBufferLen];
	UChar uTstart[StackBufferLen];
	UChar *uSource = uSstart;
	UChar *uTarget = uTstart;
	uint32_t sourceLen = source.length();
	uint32_t targetLen = target.length();

	if(sourceLen >= StackBufferLen)
		uSource = new UChar[sourceLen+1];
	
	if(targetLen >= StackBufferLen)
		uTarget = new UChar[targetLen+1];
	
  source.extract(0, sourceLen, uSource);
  uSource[sourceLen] = 0;
  target.extract(0, targetLen, uTarget);
  uTarget[targetLen] = 0;
	EComparisonResult result = compare(uSource, sourceLen, uTarget, targetLen);

	if(uSstart != uSource)
		delete[] uSource;
	
	if(uTstart != uTarget)
		delete[] uTarget;
	
	return result;
}

/**
* Retrieve a collation key for the specified string. The key can be compared 
* with other collation keys using a bitwise comparison (e.g. memcmp) to find 
* the ordering of their respective source strings. This is handy when doing a 
* sort, where each sort key must be compared many times.
*
* The basic algorithm here is to find all of the collation elements for each
* character in the source string, convert them to an ASCII representation, and 
* put them into the collation key.  But it's trickier than that. Each 
* collation element in a string has three components: primary ('A' vs 'B'), 
* secondary ('u' vs '<EFBFBD>'), and tertiary ('A' vs 'a'), and a primary difference
* at the end of a string takes precedence over a secondary or tertiary 
* difference earlier in the string.
*
* To account for this, we put all of the primary orders at the beginning of 
* the string, followed by the secondary and tertiary orders. Each set of 
* orders is terminated by nulls so that a key for a string which is a initial 
* substring of another key will compare less without any special case.
*
* Here's a hypothetical example, with the collation element represented as a 
* three-digit number, one digit for primary, one for secondary, etc.
*
* String:              A     a     B    <EFBFBD>
* Collation Elements: 101   100   201  511
* Collation Key:      1125<null>0001<null>1011<null>
*
* To make things even trickier, secondary differences (accent marks) are 
* compared starting at the *end* of the string in languages with French 
* secondary ordering. But when comparing the accent marks on a single base 
* character, they are compared from the beginning. To handle this, we reverse 
* all of the accents that belong to each base character, then we reverse the 
* entire string of secondary orderings at the end.
*/
CollationKey& RuleBasedCollator::getCollationKey(
                                                  const UnicodeString& source,
                                                  CollationKey& sortkey,
                                                  UErrorCode& status) const
{
	UChar sStart[StackBufferLen];
	UChar *uSource = sStart;
	uint32_t sourceLen = source.length();

	if(sourceLen >= StackBufferLen)
		uSource = new UChar[sourceLen+1];
	
  source.extract(0, sourceLen, uSource);
  uSource[sourceLen] = 0;
	CollationKey& result = getCollationKey(uSource, sourceLen, sortkey, status);
	if(sStart != uSource)
		delete[] uSource;

	return result;
}

CollationKey& RuleBasedCollator::getCollationKey(const UChar* source,
                                                    int32_t sourceLen,
                                                    CollationKey& sortkey,
                                                    UErrorCode& status) const
{
  if (U_FAILURE(status))
  {
    status = U_ILLEGAL_ARGUMENT_ERROR;
    return sortkey.setToBogus();
  }
    
  if ((!source) || (sourceLen == 0))
    return sortkey.reset();
    
  uint8_t *result = new uint8_t[UCOL_MAX_BUFFER];
  uint8_t resLen = ucol_getSortKey(ucollator, source, sourceLen, result,
                                   UCOL_MAX_BUFFER);
  sortkey.adopt(result, resLen);
  
  return sortkey;
}

/**
 * Return the maximum length of any expansion sequences that end with the 
 * specified comparison order.
 * @param order a collation order returned by previous or next.
 * @return the maximum length of any expansion seuences ending with the 
 *         specified order.
 * @see CollationElementIterator#getMaxExpansion
 */
int32_t RuleBasedCollator::getMaxExpansion(int32_t order) const
{
  uint8_t result;
  UCOL_GETMAXEXPANSION(ucollator, (uint32_t)order, result);
  return result;
}

uint8_t* RuleBasedCollator::cloneRuleData(int32_t &length, 
                                              UErrorCode &status)
{
  return ucol_cloneRuleData(ucollator, &length, &status);
}

void RuleBasedCollator::setAttribute(UColAttribute attr, 
                                     UColAttributeValue value, 
                                     UErrorCode &status) 
{
  if (U_FAILURE(status))
    return;
  ucol_setAttribute(ucollator, attr, value, &status);
}

UColAttributeValue RuleBasedCollator::getAttribute(UColAttribute attr, 
                                                      UErrorCode &status) 
{
  if (U_FAILURE(status))
    return UCOL_DEFAULT;
  return ucol_getAttribute(ucollator, attr, &status);
}

Collator* RuleBasedCollator::safeClone(void) 
{
  UErrorCode intStatus = U_ZERO_ERROR;
  UCollator *ucol = ucol_safeClone(ucollator, NULL, 0, &intStatus);
  if (U_FAILURE(intStatus))
    return NULL;
  int32_t length = 0;
  UnicodeString *r = new UnicodeString(ucol_getRules(ucollator, &length), 
                                       length);
  RuleBasedCollator *result = new RuleBasedCollator(ucol, r);
  result->dataIsOwned = TRUE;
  return result;
}

Collator::EComparisonResult RuleBasedCollator::compare(
                                              ForwardCharacterIterator &source,
											                        ForwardCharacterIterator &target) 
{
  return getEComparisonResult(
    ucol_strcollinc(ucollator, forwardCharIteratorGlue, &source, 
                    forwardCharIteratorGlue, &target));
}

int32_t RuleBasedCollator::getSortKey(const UnicodeString& source, 
                                         uint8_t *result, int32_t resultLength) 
                                         const 
{
	UChar sStart[StackBufferLen];
	UChar *uSource = sStart;
	uint32_t sourceLen = source.length();
	if(sourceLen >= StackBufferLen)
		uSource = new UChar[sourceLen+1];
	
  source.extract(0, sourceLen, uSource);
  uSource[sourceLen] = 0;

	uint8_t resLen = ucol_getSortKey(ucollator, uSource, sourceLen, result,
                                   resultLength);
	if(sStart != uSource)
		delete[] uSource;

	return resLen;
}

int32_t RuleBasedCollator::getSortKey(const UChar *source, 
                                         int32_t sourceLength, uint8_t *result,
						                             int32_t resultLength) const 
{
	return ucol_getSortKey(ucollator, source, sourceLength, result, resultLength);
}

Collator::ECollationStrength RuleBasedCollator::getStrength(void) const
{
  UErrorCode intStatus = U_ZERO_ERROR;
  return getECollationStrength(ucol_getAttribute(ucollator, UCOL_STRENGTH, 
                               &intStatus));
}

void RuleBasedCollator::setStrength(ECollationStrength newStrength)
{
  UErrorCode intStatus = U_ZERO_ERROR;
  UCollationStrength strength = getUCollationStrength(newStrength);
  ucol_setAttribute(ucollator, UCOL_STRENGTH, strength, &intStatus);
}

/** 
* Create a hash code for this collation. Just hash the main rule table -- that 
* should be good enough for almost any use.
*/
int32_t RuleBasedCollator::hashCode() const
{
  int32_t length;
  const UChar *rules = ucol_getRules(ucollator, &length);
  return uhash_hashUCharsN(rules, length);
}

/**
* Set the decomposition mode of the Collator object. success is equal to 
* U_ILLEGAL_ARGUMENT_ERROR if error occurs.
* @param the new decomposition mode
* @see Collator#getDecomposition
*/
void RuleBasedCollator::setDecomposition(Normalizer::EMode  mode)
{
  UErrorCode status = U_ZERO_ERROR;
  ucol_setNormalization(ucollator, Normalizer::getUNormalizationMode(mode,
                                                                     status));
}

/**
* Get the decomposition mode of the Collator object.
* @return the decomposition mode
* @see Collator#setDecomposition
*/
Normalizer::EMode RuleBasedCollator::getDecomposition(void) const
{
  UErrorCode status = U_ZERO_ERROR;
  return Normalizer::getNormalizerEMode(ucol_getNormalization(ucollator), 
                                                              status);
}

// RuleBaseCollatorNew private constructor ----------------------------------

RuleBasedCollator::RuleBasedCollator() : dataIsOwned(FALSE)
{
}

RuleBasedCollator::RuleBasedCollator(UCollator *collator, 
                                     UnicodeString *rule) : dataIsOwned(FALSE)
{
  ucollator = collator;
  urulestring = rule;
}

RuleBasedCollator::RuleBasedCollator(const Locale& desiredLocale,
                                           UErrorCode& status) : 
                                           dataIsOwned(FALSE)
{
  if (U_FAILURE(status))
    return;

  /* 
  Try to load, in order:
   1. The desired locale's collation.
   2. A fallback of the desired locale.
   3. The default locale's collation.
   4. A fallback of the default locale.
   5. The default collation rules, which contains en_US collation rules.

   To reiterate, we try:
   Specific:
    language+country+variant
    language+country
    language
   Default:
    language+country+variant
    language+country
    language
   Root: (aka DEFAULTRULES)
   steps 1-5 are handled by resource bundle fallback mechanism. 
   however, in a very unprobable situation that no resource bundle
   data exists, step 5 is repeated with hardcoded default rules.
  */

  setUCollator(desiredLocale, status);

  if (U_FAILURE(status)) 
  {
    status = U_ZERO_ERROR;
   
    setUCollator(ResourceBundle::kDefaultFilename, status);
    if (U_FAILURE(status)) 
    {
      status = U_ZERO_ERROR;

      uint32_t size = 0;
      if (status == U_ZERO_ERROR)
        status = U_USING_DEFAULT_ERROR;
      
      if (status == U_MEMORY_ALLOCATION_ERROR)
        return;
    }
  }

  if (U_SUCCESS(status))
  {
    int32_t length;
    const UChar *r = ucol_getRules(ucollator, &length);
    urulestring = new UnicodeString(r, length);
    dataIsOwned = TRUE;
  }
  
  return;
}

/* RuleBasedCollator private data members -------------------------------- */

/* need look up in .commit() */
const int32_t RuleBasedCollator::CHARINDEX = 0x70000000;             
/* Expand index follows */
const int32_t RuleBasedCollator::EXPANDCHARINDEX = 0x7E000000;       
/* contract indexes follows */
const int32_t RuleBasedCollator::CONTRACTCHARINDEX = 0x7F000000;     
/* unmapped character values */
const int32_t RuleBasedCollator::UNMAPPED = 0xFFFFFFFF;              
/* primary strength increment */
const int32_t RuleBasedCollator::PRIMARYORDERINCREMENT = 0x00010000; 
/* secondary strength increment */
const int32_t RuleBasedCollator::SECONDARYORDERINCREMENT = 0x00000100;
/* tertiary strength increment */
const int32_t RuleBasedCollator::TERTIARYORDERINCREMENT = 0x00000001;
/* mask off anything but primary order */
const int32_t RuleBasedCollator::PRIMARYORDERMASK = 0xffff0000;      
/* mask off anything but secondary order */
const int32_t RuleBasedCollator::SECONDARYORDERMASK = 0x0000ff00;    
/* mask off anything but tertiary order */
const int32_t RuleBasedCollator::TERTIARYORDERMASK = 0x000000ff;     
/* mask off ignorable char order */
const int32_t RuleBasedCollator::IGNORABLEMASK = 0x0000ffff;         
/* use only the primary difference */
const int32_t RuleBasedCollator::PRIMARYDIFFERENCEONLY = 0xffff0000; 
/* use only the primary and secondary difference */
const int32_t RuleBasedCollator::SECONDARYDIFFERENCEONLY = 0xffffff00;  
/* primary order shift */
const int32_t RuleBasedCollator::PRIMARYORDERSHIFT = 16;             
/* secondary order shift */
const int32_t RuleBasedCollator::SECONDARYORDERSHIFT = 8;            
/* starting value for collation elements */
const int32_t RuleBasedCollator::COLELEMENTSTART = 0x02020202;       
/* testing mask for primary low element */
const int32_t RuleBasedCollator::PRIMARYLOWZEROMASK = 0x00FF0000;    
/* reseting value for secondaries and tertiaries */
const int32_t RuleBasedCollator::RESETSECONDARYTERTIARY = 0x00000202;
/* reseting value for tertiaries */
const int32_t RuleBasedCollator::RESETTERTIARY = 0x00000002;         

const int32_t RuleBasedCollator::PRIMIGNORABLE = 0x0202;

/* unique file id for parity check */
const int16_t RuleBasedCollator::FILEID = 0x5443;                    
/* binary collation file extension */
const char* RuleBasedCollator::kFilenameSuffix = ".col";             
/* class id ? Value is irrelevant */ 
char  RuleBasedCollator::fgClassID = 0; 

/* other methods not belonging to any classes ------------------------------- */

UChar forwardCharIteratorGlue(void *iterator) 
{
  ForwardCharacterIterator *iter = ((ForwardCharacterIterator *)iterator);
  UChar result = iter->nextPostInc();
  if (result == ForwardCharacterIterator::DONE)
    return 0xFFFF;
  else
    return result;
}
-												Initial revision

X-SVN-Rev: 2
											
										
										
											1999-08-16 21:50:52 +00:00
+								/*
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								******************************************************************************
-												ICU-807 Added comment header

X-SVN-Rev: 3493
											
										
										
											2001-01-30 18:52:58 +00:00
+								* Copyright <EFBFBD> {1996-2001}, International Business Machines Corporation and   *
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								* others. All Rights Reserved.                                               *
 								******************************************************************************
-												Initial revision

X-SVN-Rev: 2
											
										
										
											1999-08-16 21:50:52 +00:00
+								*/
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								/**
-												ICU-807 Added comment header

X-SVN-Rev: 3493
											
										
										
											2001-01-30 18:52:58 +00:00
+								* File tblcoll.cpp
 								*
 								* Created by: Helena Shih
 								*
 								* Modification History:
 								*
 								*  Date        Name        Description
 								*  2/5/97      aliu        Added streamIn and streamOut methods.  Added
 								*                          constructor which reads RuleBasedCollator object from
 								*                          a binary file.  Added writeToFile method which streams
 								*                          RuleBasedCollator out to a binary file.  The streamIn
 								*                          and streamOut methods use istream and ostream objects
 								*                          in binary mode.
 								*  2/11/97     aliu        Moved declarations out of for loop initializer.
 								*                          Added Mac compatibility #ifdef for ios::nocreate.
 								*  2/12/97     aliu        Modified to use TableCollationData sub-object to
 								*                          hold invariant data.
 								*  2/13/97     aliu        Moved several methods into this class from Collation.
 								*                          Added a private RuleBasedCollator(Locale&) constructor,
 								*                          to be used by Collator::getInstance().  General
 								*                          clean up.  Made use of UErrorCode variables consistent.
 								*  2/20/97     helena      Added clone, operator==, operator!=, operator=, and copy
 								*                          constructor and getDynamicClassID.
 								*  3/5/97      aliu        Changed compaction cycle to improve performance.  We
 								*                          use the maximum allowable value which is kBlockCount.
 								*                          Modified getRules() to load rules dynamically.  Changed
 								*                          constructFromFile() call to accomodate this (added
 								*                          parameter to specify whether binary loading is to
 								*                          take place).
 								* 05/06/97     helena      Added memory allocation error check.
 								*  6/20/97     helena      Java class name change.
 								*  6/23/97     helena      Adding comments to make code more readable.
 								* 09/03/97     helena      Added createCollationKeyValues().
 								* 06/26/98     erm         Changes for CollationKeys using byte arrays.
 								* 08/10/98     erm         Synched with 1.2 version of RuleBasedCollator.java
 								* 04/23/99     stephen     Removed EDecompositionMode, merged with
 								*                          Normalizer::EMode
 								* 06/14/99     stephen     Removed kResourceBundleSuffix
 								* 06/22/99     stephen     Fixed logic in constructFromFile() since .ctx
 								*                          files are no longer used.
 								* 11/02/99     helena      Collator performance enhancements.  Special case
 								*                          for NO_OP situations.
 								* 11/17/99     srl         More performance enhancements. Inlined some internal functions.
 								* 12/15/99     aliu        Update to support Thai collation.  Move NormalizerIterator
 								*                          to implementation file.
 								* 01/29/01     synwee      Modified into a C++ wrapper calling C APIs (ucol.h)
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								*/
-												Initial revision

X-SVN-Rev: 2
											
										
										
											1999-08-16 21:50:52 +00:00
-												ICU-96 collation key adopt, ucol_createSortKey, fix for collation key hash code, C++ incremental compare implementation

X-SVN-Rev: 3196
											
										
										
											2000-12-12 01:15:30 +00:00
+								#include "ucolimp.h"
-												ICU-96 cleanup, comments, debugging

X-SVN-Rev: 3222
											
										
										
											2000-12-14 01:11:11 +00:00
+								#include "unicode/tblcoll.h"
-												ICU-12 all public include files are now in unicode dir, all private icu_ functions renamed to uprv_

X-SVN-Rev: 473
											
										
										
											1999-12-28 23:57:50 +00:00
+								#include "unicode/coleitr.h"
-												ICU-807 
Modified include statement for uhash.h to make as400 happy.

X-SVN-Rev: 3702
											
										
										
											2001-02-21 01:59:39 +00:00
+								#include "uhash.h"
-												ICU-12 all public include files are now in unicode dir, all private icu_ functions renamed to uprv_

X-SVN-Rev: 473
											
										
										
											1999-12-28 23:57:50 +00:00
+								#include "unicode/resbund.h"
-												Initial revision

X-SVN-Rev: 2
											
										
										
											1999-08-16 21:50:52 +00:00
 								#ifdef _DEBUG
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								  #include "unistrm.h"
-												Initial revision

X-SVN-Rev: 2
											
										
										
											1999-08-16 21:50:52 +00:00
+								#endif
-												ICU-833 
Replaced quickcheck with checkFCD

X-SVN-Rev: 3633
											
										
										
											2001-02-15 19:30:25 +00:00
+								/* forward declarations ----------------------------------------------------- */
-												Initial revision

X-SVN-Rev: 2
											
										
										
											1999-08-16 21:50:52 +00:00
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								UChar forwardCharIteratorGlue(void *iterator);
-												ICU-96 performance improvements

X-SVN-Rev: 247
											
										
										
											1999-11-23 22:49:29 +00:00
-												ICU-833 
Replaced quickcheck with checkFCD

X-SVN-Rev: 3633
											
										
										
											2001-02-15 19:30:25 +00:00
+								/* global variable ---------------------------------------------------------- */
-												ICU-420 missed some..

X-SVN-Rev: 1559
											
										
										
											2000-06-03 04:37:12 +00:00
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								/*
 								synwee : using another name for this
-												ICU-96 new implementation for sortkey generation and compare is active. Expect errors in tests

X-SVN-Rev: 2983
											
										
										
											2000-11-22 00:04:03 +00:00
+								const uint32_t tblcoll_StackBufferLen = 1024;
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								*/
 								const uint32_t StackBufferLen = 1024;
-												Initial revision

X-SVN-Rev: 2
											
										
										
											1999-08-16 21:50:52 +00:00
-												ICU-833 
Replaced quickcheck with checkFCD

X-SVN-Rev: 3633
											
										
										
											2001-02-15 19:30:25 +00:00
+								/* RuleBasedCollator declaration ----------------------------------------- */
 								/* ---------------------------------------------------------------------------
 								The following diagram shows the data structure of the RuleBasedCollator  object.
 								Suppose we have the rule, where 'o-umlaut' is the unicode char 0x00F6.
 								"a, A < b, B < c, C, ch, cH, Ch, CH < d, D ... < o, O;
 								'o-umlaut'/E, 'O-umlaut'/E ...".
 								What the rule says is, sorts 'ch'ligatures and 'c' only with tertiary
 								difference and sorts 'o-umlaut' as if it's always expanded with 'e'.
 								mapping table                 contracting list             expanding list
 								(contains all unicode
 								char entries)               ___    ____________      _________________________
 								 ________                |=>|_*_|->|'c' |v('c') | |=>|v('o')|v('umlaut')|v('e')|
 								|_\u0001_|-> v('\u0001') |  |_:_|  |------------| |  |-------------------------|
 								|_\u0002_|-> v('\u0002') |  |_:_|  |'ch'|v('ch')| |  |             :           |
 								|____:___|               |  |_:_|  |------------| |  |-------------------------|
 								|____:___|               |         |'cH'|v('cH')| |  |             :           |
 								|__'a'___|-> v('a')      |         |------------| |  |-------------------------|
 								|__'b'___|-> v('b')      |         |'Ch'|v('Ch')| |  |             :           |
 								|____:___|               |         |------------| |  |-------------------------|
 								|____:___|               |         |'CH'|v('CH')| |  |             :           |
 								|___'c'__|----------------          ------------  |  |-------------------------|
 								|____:___|                                        |  |             :           |
 								|o-umlaut|----------------------------------------   |_________________________|
 								|____:___|
 								--------------------------------------------------------------------------- */
 								/* public RuleBasedCollator constructor ---------------------------------- */
-												Initial revision

X-SVN-Rev: 2
											
										
										
											1999-08-16 21:50:52 +00:00
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								/**
 								* Copy constructor
-												ICU-159 Thai collation

X-SVN-Rev: 426
											
										
										
											1999-12-16 01:41:19 +00:00
+								*/
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								RuleBasedCollator::RuleBasedCollator(const RuleBasedCollator& that) :
-												ICU-807 Added comment header

X-SVN-Rev: 3493
											
										
										
											2001-01-30 18:52:58 +00:00
+								              Collator(that), dataIsOwned(FALSE), ucollator(that.ucollator),
 								              urulestring(that.urulestring)
-												ICU-159 Thai collation

X-SVN-Rev: 426
											
										
										
											1999-12-16 01:41:19 +00:00
+								{
 								}
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								RuleBasedCollator::RuleBasedCollator(const UnicodeString& rules,
 								                                           UErrorCode& status) :
 								                                           dataIsOwned(FALSE)
-												ICU-159 Thai collation

X-SVN-Rev: 426
											
										
										
											1999-12-16 01:41:19 +00:00
+								{
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								  if (U_FAILURE(status))
 								    return;
 								  int32_t length = rules.length();
-												ICU-159 Thai collation

X-SVN-Rev: 426
											
										
										
											1999-12-16 01:41:19 +00:00
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+									UChar ucharrules[StackBufferLen];
 									UChar *pucharrules = ucharrules;
 								  if (length >= StackBufferLen)
 										pucharrules = new UChar[length + 1];
 									rules.extract(0, length, pucharrules);
 								  pucharrules[length] = 0;
-												ICU-159 Thai collation

X-SVN-Rev: 426
											
										
										
											1999-12-16 01:41:19 +00:00
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								  ucollator = ucol_openRules(pucharrules, length, UCOL_DEFAULT_NORMALIZATION,
 								                             UCOL_DEFAULT_STRENGTH, &status);
-												ICU-807 Added comment header

X-SVN-Rev: 3493
											
										
										
											2001-01-30 18:52:58 +00:00
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								  if (U_SUCCESS(status))
-												ICU-807 Added comment header

X-SVN-Rev: 3493
											
										
										
											2001-01-30 18:52:58 +00:00
+								  {
 								    const UChar *r = ucol_getRules(ucollator, &length);
 								    urulestring = new UnicodeString(r, length);
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								    dataIsOwned = TRUE;
-												ICU-807 Added comment header

X-SVN-Rev: 3493
											
										
										
											2001-01-30 18:52:58 +00:00
+								  }
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
 									if (pucharrules != ucharrules)
 										delete[] pucharrules;
-												ICU-159 Thai collation

X-SVN-Rev: 426
											
										
										
											1999-12-16 01:41:19 +00:00
+								}
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								RuleBasedCollator::RuleBasedCollator(const UnicodeString& rules,
 								                      ECollationStrength collationStrength,
 								                      UErrorCode& status) : dataIsOwned(FALSE)
-												ICU-159 Thai collation

X-SVN-Rev: 426
											
										
										
											1999-12-16 01:41:19 +00:00
+								{
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								  if (U_FAILURE(status))
 								    return;
 								  int32_t length = rules.length();
-												ICU-159 Thai collation

X-SVN-Rev: 426
											
										
										
											1999-12-16 01:41:19 +00:00
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+									UChar ucharrules[StackBufferLen];
 									UChar *pucharrules = ucharrules;
 								  if (length >= StackBufferLen)
 										pucharrules = new UChar[length + 1];
 									rules.extract(0, length, pucharrules);
 								  pucharrules[length] = 0;
-												ICU-159 Thai collation

X-SVN-Rev: 426
											
										
										
											1999-12-16 01:41:19 +00:00
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								  UCollationStrength strength = getUCollationStrength(collationStrength);
 								  ucollator = ucol_openRules(pucharrules, length, UCOL_DEFAULT_NORMALIZATION,
 								                             strength, &status);
 								  if (U_SUCCESS(status))
-												ICU-807 Added comment header

X-SVN-Rev: 3493
											
										
										
											2001-01-30 18:52:58 +00:00
+								  {
 								    const UChar *r = ucol_getRules(ucollator, &length);
 								    urulestring = new UnicodeString(r, length);
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								    dataIsOwned = TRUE;
-												ICU-807 Added comment header

X-SVN-Rev: 3493
											
										
										
											2001-01-30 18:52:58 +00:00
+								  }
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
 									if (pucharrules != ucharrules)
 										delete[] pucharrules;
-												ICU-159 Thai collation

X-SVN-Rev: 426
											
										
										
											1999-12-16 01:41:19 +00:00
+								}
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								RuleBasedCollator::RuleBasedCollator(const UnicodeString& rules,
 								                                     Normalizer::EMode decompositionMode,
 								                                     UErrorCode& status) :
 								                                     dataIsOwned(FALSE)
-												ICU-159 Thai collation

X-SVN-Rev: 426
											
										
										
											1999-12-16 01:41:19 +00:00
+								{
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								  if (U_FAILURE(status))
 								    return;
 								  int32_t length = rules.length();
-												ICU-159 Thai collation

X-SVN-Rev: 426
											
										
										
											1999-12-16 01:41:19 +00:00
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+									UChar ucharrules[StackBufferLen];
 									UChar *pucharrules = ucharrules;
 								  if (length >= StackBufferLen)
 										pucharrules = new UChar[length + 1];
 									rules.extract(0, length, pucharrules);
 								  pucharrules[length] = 0;
-												ICU-159 Thai collation

X-SVN-Rev: 426
											
										
										
											1999-12-16 01:41:19 +00:00
-												ICU-833 
Because of the new Normalization enum conversion methods, changes have
to be done in tbcoll.

X-SVN-Rev: 3553
											
										
										
											2001-02-03 01:27:02 +00:00
+								  UNormalizationMode mode = Normalizer::getUNormalizationMode(
 								                                                   decompositionMode, status);
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								  ucollator = ucol_openRules(pucharrules, length, mode,
 								                             UCOL_DEFAULT_STRENGTH, &status);
-												ICU-159 Thai collation

X-SVN-Rev: 426
											
										
										
											1999-12-16 01:41:19 +00:00
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								  if (U_SUCCESS(status))
-												ICU-807 Added comment header

X-SVN-Rev: 3493
											
										
										
											2001-01-30 18:52:58 +00:00
+								  {
 								    const UChar *r = ucol_getRules(ucollator, &length);
 								    urulestring = new UnicodeString(r, length);
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								    dataIsOwned = TRUE;
-												ICU-807 Added comment header

X-SVN-Rev: 3493
											
										
										
											2001-01-30 18:52:58 +00:00
+								  }
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
 									if (pucharrules != ucharrules)
 										delete[] pucharrules;
-												ICU-159 Thai collation

X-SVN-Rev: 426
											
										
										
											1999-12-16 01:41:19 +00:00
+								}
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								RuleBasedCollator::RuleBasedCollator(const UnicodeString& rules,
 								                      ECollationStrength collationStrength,
 								                      Normalizer::EMode decompositionMode,
 								                      UErrorCode& status) : dataIsOwned(FALSE)
-												ICU-159 Thai collation

X-SVN-Rev: 426
											
										
										
											1999-12-16 01:41:19 +00:00
+								{
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								  if (U_FAILURE(status))
 								    return;
-												ICU-96 Inline function RuleBasedCollator::makeReorderedBuffer
called before being defined.  Fixed it.

X-SVN-Rev: 572
											
										
										
											2000-01-13 21:36:39 +00:00
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								  int32_t length = rules.length();
-												ICU-96 Inline function RuleBasedCollator::makeReorderedBuffer
called before being defined.  Fixed it.

X-SVN-Rev: 572
											
										
										
											2000-01-13 21:36:39 +00:00
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+									UChar ucharrules[StackBufferLen];
 									UChar *pucharrules = ucharrules;
 								  if (length >= StackBufferLen)
 										pucharrules = new UChar[length + 1];
 									rules.extract(0, length, pucharrules);
 								  pucharrules[length] = 0;
 								  UCollationStrength strength = getUCollationStrength(collationStrength);
-												ICU-833 
Because of the new Normalization enum conversion methods, changes have
to be done in tbcoll.

X-SVN-Rev: 3553
											
										
										
											2001-02-03 01:27:02 +00:00
+								  UNormalizationMode mode = Normalizer::getUNormalizationMode(
 								                                                   decompositionMode, status);
-												ICU-807 Added comment header

X-SVN-Rev: 3493
											
										
										
											2001-01-30 18:52:58 +00:00
+								  ucollator = ucol_openRules(pucharrules, length, mode, strength, &status);
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								  if (U_SUCCESS(status))
-												ICU-807 Added comment header

X-SVN-Rev: 3493
											
										
										
											2001-01-30 18:52:58 +00:00
+								  {
 								    const UChar *r = ucol_getRules(ucollator, &length);
 								    urulestring = new UnicodeString(r, length);
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								    dataIsOwned = TRUE;
-												ICU-807 Added comment header

X-SVN-Rev: 3493
											
										
										
											2001-01-30 18:52:58 +00:00
+								  }
-												ICU-96 Inline function RuleBasedCollator::makeReorderedBuffer
called before being defined.  Fixed it.

X-SVN-Rev: 572
											
										
										
											2000-01-13 21:36:39 +00:00
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+									if (pucharrules != ucharrules)
 										delete[] pucharrules;
-												ICU-96 Inline function RuleBasedCollator::makeReorderedBuffer
called before being defined.  Fixed it.

X-SVN-Rev: 572
											
										
										
											2000-01-13 21:36:39 +00:00
+								}
-												ICU-833 
Replaced quickcheck with checkFCD

X-SVN-Rev: 3633
											
										
										
											2001-02-15 19:30:25 +00:00
+								/* RuleBasedCollator public destructor ----------------------------------- */
-												ICU-96 Inline function RuleBasedCollator::makeReorderedBuffer
called before being defined.  Fixed it.

X-SVN-Rev: 572
											
										
										
											2000-01-13 21:36:39 +00:00
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								RuleBasedCollator::~RuleBasedCollator()
-												ICU-96 performance improvements

X-SVN-Rev: 247
											
										
										
											1999-11-23 22:49:29 +00:00
+								{
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								  if (dataIsOwned)
 								  {
 								    ucol_close(ucollator);
-												ICU-807 Added comment header

X-SVN-Rev: 3493
											
										
										
											2001-01-30 18:52:58 +00:00
+								    delete urulestring;
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								  }
-												ICU-807 Added comment header

X-SVN-Rev: 3493
											
										
										
											2001-01-30 18:52:58 +00:00
+								  ucollator = NULL;
-												ICU-96 performance improvements

X-SVN-Rev: 247
											
										
										
											1999-11-23 22:49:29 +00:00
+								}
-												ICU-833 
Replaced quickcheck with checkFCD

X-SVN-Rev: 3633
											
										
										
											2001-02-15 19:30:25 +00:00
+								/* RuleBaseCollator public methods --------------------------------------- */
-												ICU-96 performance improvements

X-SVN-Rev: 247
											
										
										
											1999-11-23 22:49:29 +00:00
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								UBool RuleBasedCollator::operator==(const Collator& that) const
-												ICU-96 performance improvements

X-SVN-Rev: 247
											
										
										
											1999-11-23 22:49:29 +00:00
+								{
-												ICU-833 
Replaced quickcheck with checkFCD

X-SVN-Rev: 3633
											
										
										
											2001-02-15 19:30:25 +00:00
+								  /* only checks for address equals here */
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								  if (Collator::operator==(that))
 								    return TRUE;
 								  if (getDynamicClassID() != that.getDynamicClassID())
-												ICU-833 
Replaced quickcheck with checkFCD

X-SVN-Rev: 3633
											
										
										
											2001-02-15 19:30:25 +00:00
+								    return FALSE;  /* not the same class */
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
 								  RuleBasedCollator& thatAlias = (RuleBasedCollator&)that;
-												ICU-96 performance improvements

X-SVN-Rev: 247
											
										
										
											1999-11-23 22:49:29 +00:00
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								  /*
 								  synwee : orginal code does not check for data compatibility
 								  */
 								  if (ucollator != thatAlias.ucollator)
 								    return FALSE;
-												ICU-96 performance improvements

X-SVN-Rev: 247
											
										
										
											1999-11-23 22:49:29 +00:00
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								  return TRUE;
 								}
-												ICU-96 performance improvements

X-SVN-Rev: 247
											
										
										
											1999-11-23 22:49:29 +00:00
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								RuleBasedCollator& RuleBasedCollator::operator=(
 								                                              const RuleBasedCollator& that)
 								{
 								  if (this != &that)
 								  {
 								    if (dataIsOwned)
-												ICU-96 performance improvements

X-SVN-Rev: 247
											
										
										
											1999-11-23 22:49:29 +00:00
+								    {
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								      ucol_close(ucollator);
 								      ucollator = NULL;
-												ICU-807 Added comment header

X-SVN-Rev: 3493
											
										
										
											2001-01-30 18:52:58 +00:00
+								      delete urulestring;
-												ICU-96 performance improvements

X-SVN-Rev: 247
											
										
										
											1999-11-23 22:49:29 +00:00
+								    }
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
 								    dataIsOwned = FALSE;
 								    ucollator = that.ucollator;
-												ICU-807 Added comment header

X-SVN-Rev: 3493
											
										
										
											2001-01-30 18:52:58 +00:00
+								    urulestring = that.urulestring;
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								  }
 								  return *this;
-												ICU-96 performance improvements

X-SVN-Rev: 247
											
										
										
											1999-11-23 22:49:29 +00:00
+								}
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								Collator* RuleBasedCollator::clone() const
 								{
 								  return new RuleBasedCollator(*this);
 								}
-												ICU-96 performance improvements

X-SVN-Rev: 247
											
										
										
											1999-11-23 22:49:29 +00:00
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								/**
 								* Create a CollationElementIterator object that will iterator over the
 								* elements in a string, using the collation rules defined in this
 								* RuleBasedCollator
 								*/
 								CollationElementIterator* RuleBasedCollator::createCollationElementIterator
 								                                           (const UnicodeString& source) const
 								{
 								  UErrorCode status = U_ZERO_ERROR;
-												ICU-807 Added comment header

X-SVN-Rev: 3493
											
										
										
											2001-01-30 18:52:58 +00:00
+								  CollationElementIterator *result = new CollationElementIterator(source, this,
 								                                                                  status);
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
 								  if (U_FAILURE(status))
 								    return NULL;
-												ICU-807 Added comment header

X-SVN-Rev: 3493
											
										
										
											2001-01-30 18:52:58 +00:00
+								  return result;
-												ICU-96 Better memory management in sort key, safe clone implementation

X-SVN-Rev: 3162
											
										
										
											2000-12-07 07:22:55 +00:00
+								}
-												Initial revision

X-SVN-Rev: 2
											
										
										
											1999-08-16 21:50:52 +00:00
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								/**
 								* Create a CollationElementIterator object that will iterator over the
 								* elements in a string, using the collation rules defined in this
 								* RuleBasedCollator
 								*/
 								CollationElementIterator* RuleBasedCollator::createCollationElementIterator
 								                                       (const CharacterIterator& source) const
-												Initial revision

X-SVN-Rev: 2
											
										
										
											1999-08-16 21:50:52 +00:00
+								{
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								  UErrorCode status = U_ZERO_ERROR;
-												ICU-807 Added comment header

X-SVN-Rev: 3493
											
										
										
											2001-01-30 18:52:58 +00:00
+								  CollationElementIterator *result = new CollationElementIterator(source, this,
 								                                                                  status);
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
 								  if (U_FAILURE(status))
 								    return NULL;
-												ICU-807 Added comment header

X-SVN-Rev: 3493
											
										
										
											2001-01-30 18:52:58 +00:00
+								  return result;
-												Initial revision

X-SVN-Rev: 2
											
										
										
											1999-08-16 21:50:52 +00:00
+								}
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								/**
 								* Return a string representation of this collator's rules. The string can
 								* later be passed to the constructor that takes a UnicodeString argument,
 								* which will construct a collator that's functionally identical to this one.
 								* You can also allow users to edit the string in order to change the collation
 								* data, or you can print it out for inspection, or whatever.
 								*/
 								const UnicodeString& RuleBasedCollator::getRules() const
-												Initial revision

X-SVN-Rev: 2
											
										
										
											1999-08-16 21:50:52 +00:00
+								{
-												ICU-807 Added comment header

X-SVN-Rev: 3493
											
										
										
											2001-01-30 18:52:58 +00:00
+								  return (*urulestring);
-												Initial revision

X-SVN-Rev: 2
											
										
										
											1999-08-16 21:50:52 +00:00
+								}
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								Collator::EComparisonResult RuleBasedCollator::compare(
 								                                               const UnicodeString& source,
 								                                               const UnicodeString& target,
 								                                               int32_t length) const
-												Initial revision

X-SVN-Rev: 2
											
										
										
											1999-08-16 21:50:52 +00:00
+								{
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								  UnicodeString source_togo;
 								  UnicodeString target_togo;
 								  UTextOffset begin=0;
-												Initial revision

X-SVN-Rev: 2
											
										
										
											1999-08-16 21:50:52 +00:00
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								  source.extract(begin, uprv_min(length,source.length()), source_togo);
 								  target.extract(begin, uprv_min(length,target.length()), target_togo);
 								  return compare(source_togo, target_togo);
 								}
-												Initial revision

X-SVN-Rev: 2
											
										
										
											1999-08-16 21:50:52 +00:00
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								Collator::EComparisonResult RuleBasedCollator::compare(const UChar* source,
 								                                                       int32_t sourceLength,
 								                                                       const UChar* target,
 								                                                       int32_t targetLength)
 								                                                       const
 								{
 								  return getEComparisonResult(ucol_strcoll(ucollator, source, sourceLength,
 								                                                     target, targetLength));
 								}
-												Initial revision

X-SVN-Rev: 2
											
										
										
											1999-08-16 21:50:52 +00:00
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								/**
 								* Compare two strings using this collator
 								*/
 								Collator::EComparisonResult RuleBasedCollator::compare(
 								                                             const UnicodeString& source,
 								                                             const UnicodeString& target) const
 								{
 								  UChar uSstart[StackBufferLen];
 									UChar uTstart[StackBufferLen];
 									UChar *uSource = uSstart;
 									UChar *uTarget = uTstart;
 									uint32_t sourceLen = source.length();
 									uint32_t targetLen = target.length();
-												Initial revision

X-SVN-Rev: 2
											
										
										
											1999-08-16 21:50:52 +00:00
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+									if(sourceLen >= StackBufferLen)
 										uSource = new UChar[sourceLen+1];
 									if(targetLen >= StackBufferLen)
 										uTarget = new UChar[targetLen+1];
 								  source.extract(0, sourceLen, uSource);
 								  uSource[sourceLen] = 0;
 								  target.extract(0, targetLen, uTarget);
 								  uTarget[targetLen] = 0;
 									EComparisonResult result = compare(uSource, sourceLen, uTarget, targetLen);
-												Initial revision

X-SVN-Rev: 2
											
										
										
											1999-08-16 21:50:52 +00:00
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+									if(uSstart != uSource)
 										delete[] uSource;
 									if(uTstart != uTarget)
 										delete[] uTarget;
 									return result;
-												Initial revision

X-SVN-Rev: 2
											
										
										
											1999-08-16 21:50:52 +00:00
+								}
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								/**
 								* Retrieve a collation key for the specified string. The key can be compared
 								* with other collation keys using a bitwise comparison (e.g. memcmp) to find
 								* the ordering of their respective source strings. This is handy when doing a
 								* sort, where each sort key must be compared many times.
 								*
 								* The basic algorithm here is to find all of the collation elements for each
 								* character in the source string, convert them to an ASCII representation, and
 								* put them into the collation key.  But it's trickier than that. Each
 								* collation element in a string has three components: primary ('A' vs 'B'),
 								* secondary ('u' vs '<EFBFBD>'), and tertiary ('A' vs 'a'), and a primary difference
 								* at the end of a string takes precedence over a secondary or tertiary
 								* difference earlier in the string.
 								*
 								* To account for this, we put all of the primary orders at the beginning of
 								* the string, followed by the secondary and tertiary orders. Each set of
 								* orders is terminated by nulls so that a key for a string which is a initial
 								* substring of another key will compare less without any special case.
 								*
 								* Here's a hypothetical example, with the collation element represented as a
 								* three-digit number, one digit for primary, one for secondary, etc.
 								*
 								* String:              A     a     B    <EFBFBD>
 								* Collation Elements: 101   100   201  511
 								* Collation Key:      1125<null>0001<null>1011<null>
 								*
 								* To make things even trickier, secondary differences (accent marks) are
 								* compared starting at the *end* of the string in languages with French
 								* secondary ordering. But when comparing the accent marks on a single base
 								* character, they are compared from the beginning. To handle this, we reverse
 								* all of the accents that belong to each base character, then we reverse the
 								* entire string of secondary orderings at the end.
 								*/
 								CollationKey& RuleBasedCollator::getCollationKey(
 								                                                  const UnicodeString& source,
 								                                                  CollationKey& sortkey,
 								                                                  UErrorCode& status) const
-												Initial revision

X-SVN-Rev: 2
											
										
										
											1999-08-16 21:50:52 +00:00
+								{
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+									UChar sStart[StackBufferLen];
 									UChar *uSource = sStart;
 									uint32_t sourceLen = source.length();
-												Initial revision

X-SVN-Rev: 2
											
										
										
											1999-08-16 21:50:52 +00:00
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+									if(sourceLen >= StackBufferLen)
 										uSource = new UChar[sourceLen+1];
 								  source.extract(0, sourceLen, uSource);
 								  uSource[sourceLen] = 0;
 									CollationKey& result = getCollationKey(uSource, sourceLen, sortkey, status);
 									if(sStart != uSource)
 										delete[] uSource;
-												Initial revision

X-SVN-Rev: 2
											
										
										
											1999-08-16 21:50:52 +00:00
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+									return result;
 								}
-												ICU-96 cleanup, comments, debugging

X-SVN-Rev: 3222
											
										
										
											2000-12-14 01:11:11 +00:00
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								CollationKey& RuleBasedCollator::getCollationKey(const UChar* source,
 								                                                    int32_t sourceLen,
 								                                                    CollationKey& sortkey,
 								                                                    UErrorCode& status) const
-												Initial revision

X-SVN-Rev: 2
											
										
										
											1999-08-16 21:50:52 +00:00
+								{
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								  if (U_FAILURE(status))
 								  {
 								    status = U_ILLEGAL_ARGUMENT_ERROR;
 								    return sortkey.setToBogus();
 								  }
 								  if ((!source) || (sourceLen == 0))
 								    return sortkey.reset();
 								  uint8_t *result = new uint8_t[UCOL_MAX_BUFFER];
 								  uint8_t resLen = ucol_getSortKey(ucollator, source, sourceLen, result,
 								                                   UCOL_MAX_BUFFER);
 								  sortkey.adopt(result, resLen);
 								  return sortkey;
-												Initial revision

X-SVN-Rev: 2
											
										
										
											1999-08-16 21:50:52 +00:00
+								}
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								/**
 								 * Return the maximum length of any expansion sequences that end with the
 								 * specified comparison order.
 								 * @param order a collation order returned by previous or next.
 								 * @return the maximum length of any expansion seuences ending with the
 								 *         specified order.
 								 * @see CollationElementIterator#getMaxExpansion
 								 */
 								int32_t RuleBasedCollator::getMaxExpansion(int32_t order) const
-												Initial revision

X-SVN-Rev: 2
											
										
										
											1999-08-16 21:50:52 +00:00
+								{
-												ICU-878 
Added getMaxExpansion to collator

X-SVN-Rev: 3871
											
										
										
											2001-03-02 01:14:03 +00:00
+								  uint8_t result;
 								  UCOL_GETMAXEXPANSION(ucollator, (uint32_t)order, result);
 								  return result;
-												Initial revision

X-SVN-Rev: 2
											
										
										
											1999-08-16 21:50:52 +00:00
+								}
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								uint8_t* RuleBasedCollator::cloneRuleData(int32_t &length,
 								                                              UErrorCode &status)
 								{
 								  return ucol_cloneRuleData(ucollator, &length, &status);
 								}
-												ICU-96 cleanup, comments, debugging

X-SVN-Rev: 3222
											
										
										
											2000-12-14 01:11:11 +00:00
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								void RuleBasedCollator::setAttribute(UColAttribute attr,
 								                                     UColAttributeValue value,
 								                                     UErrorCode &status)
-												Initial revision

X-SVN-Rev: 2
											
										
										
											1999-08-16 21:50:52 +00:00
+								{
-												ICU-6 more renaming of constant names
FAILURE -> U_FAILURE etc.

X-SVN-Rev: 76
											
										
										
											1999-10-18 22:48:32 +00:00
+								  if (U_FAILURE(status))
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								    return;
 								  ucol_setAttribute(ucollator, attr, value, &status);
-												Initial revision

X-SVN-Rev: 2
											
										
										
											1999-08-16 21:50:52 +00:00
+								}
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								UColAttributeValue RuleBasedCollator::getAttribute(UColAttribute attr,
 								                                                      UErrorCode &status)
-												Initial revision

X-SVN-Rev: 2
											
										
										
											1999-08-16 21:50:52 +00:00
+								{
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								  if (U_FAILURE(status))
 								    return UCOL_DEFAULT;
 								  return ucol_getAttribute(ucollator, attr, &status);
-												Initial revision

X-SVN-Rev: 2
											
										
										
											1999-08-16 21:50:52 +00:00
+								}
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								Collator* RuleBasedCollator::safeClone(void)
-												Initial revision

X-SVN-Rev: 2
											
										
										
											1999-08-16 21:50:52 +00:00
+								{
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								  UErrorCode intStatus = U_ZERO_ERROR;
 								  UCollator *ucol = ucol_safeClone(ucollator, NULL, 0, &intStatus);
 								  if (U_FAILURE(intStatus))
 								    return NULL;
-												ICU-807 Added comment header

X-SVN-Rev: 3493
											
										
										
											2001-01-30 18:52:58 +00:00
+								  int32_t length = 0;
 								  UnicodeString *r = new UnicodeString(ucol_getRules(ucollator, &length),
 								                                       length);
 								  RuleBasedCollator *result = new RuleBasedCollator(ucol, r);
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								  result->dataIsOwned = TRUE;
 								  return result;
 								}
-												Initial revision

X-SVN-Rev: 2
											
										
										
											1999-08-16 21:50:52 +00:00
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								Collator::EComparisonResult RuleBasedCollator::compare(
 								                                              ForwardCharacterIterator &source,
 																			                        ForwardCharacterIterator &target)
 								{
 								  return getEComparisonResult(
 								    ucol_strcollinc(ucollator, forwardCharIteratorGlue, &source,
 								                    forwardCharIteratorGlue, &target));
 								}
-												Initial revision

X-SVN-Rev: 2
											
										
										
											1999-08-16 21:50:52 +00:00
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								int32_t RuleBasedCollator::getSortKey(const UnicodeString& source,
 								                                         uint8_t *result, int32_t resultLength)
 								                                         const
 								{
 									UChar sStart[StackBufferLen];
 									UChar *uSource = sStart;
 									uint32_t sourceLen = source.length();
 									if(sourceLen >= StackBufferLen)
 										uSource = new UChar[sourceLen+1];
 								  source.extract(0, sourceLen, uSource);
 								  uSource[sourceLen] = 0;
-												Initial revision

X-SVN-Rev: 2
											
										
										
											1999-08-16 21:50:52 +00:00
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+									uint8_t resLen = ucol_getSortKey(ucollator, uSource, sourceLen, result,
 								                                   resultLength);
 									if(sStart != uSource)
 										delete[] uSource;
-												Initial revision

X-SVN-Rev: 2
											
										
										
											1999-08-16 21:50:52 +00:00
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+									return resLen;
-												Initial revision

X-SVN-Rev: 2
											
										
										
											1999-08-16 21:50:52 +00:00
+								}
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								int32_t RuleBasedCollator::getSortKey(const UChar *source,
 								                                         int32_t sourceLength, uint8_t *result,
 														                             int32_t resultLength) const
-												Initial revision

X-SVN-Rev: 2
											
										
										
											1999-08-16 21:50:52 +00:00
+								{
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+									return ucol_getSortKey(ucollator, source, sourceLength, result, resultLength);
 								}
-												Initial revision

X-SVN-Rev: 2
											
										
										
											1999-08-16 21:50:52 +00:00
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								Collator::ECollationStrength RuleBasedCollator::getStrength(void) const
 								{
 								  UErrorCode intStatus = U_ZERO_ERROR;
 								  return getECollationStrength(ucol_getAttribute(ucollator, UCOL_STRENGTH,
 								                               &intStatus));
 								}
-												Initial revision

X-SVN-Rev: 2
											
										
										
											1999-08-16 21:50:52 +00:00
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								void RuleBasedCollator::setStrength(ECollationStrength newStrength)
 								{
 								  UErrorCode intStatus = U_ZERO_ERROR;
 								  UCollationStrength strength = getUCollationStrength(newStrength);
 								  ucol_setAttribute(ucollator, UCOL_STRENGTH, strength, &intStatus);
 								}
-												Initial revision

X-SVN-Rev: 2
											
										
										
											1999-08-16 21:50:52 +00:00
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								/**
 								* Create a hash code for this collation. Just hash the main rule table -- that
 								* should be good enough for almost any use.
 								*/
 								int32_t RuleBasedCollator::hashCode() const
 								{
 								  int32_t length;
 								  const UChar *rules = ucol_getRules(ucollator, &length);
 								  return uhash_hashUCharsN(rules, length);
 								}
-												Initial revision

X-SVN-Rev: 2
											
										
										
											1999-08-16 21:50:52 +00:00
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								/**
 								* Set the decomposition mode of the Collator object. success is equal to
 								* U_ILLEGAL_ARGUMENT_ERROR if error occurs.
 								* @param the new decomposition mode
 								* @see Collator#getDecomposition
 								*/
 								void RuleBasedCollator::setDecomposition(Normalizer::EMode  mode)
 								{
-												ICU-833 
Because of the new Normalization enum conversion methods, changes have
to be done in tbcoll.

X-SVN-Rev: 3553
											
										
										
											2001-02-03 01:27:02 +00:00
+								  UErrorCode status = U_ZERO_ERROR;
 								  ucol_setNormalization(ucollator, Normalizer::getUNormalizationMode(mode,
 								                                                                     status));
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								}
-												Initial revision

X-SVN-Rev: 2
											
										
										
											1999-08-16 21:50:52 +00:00
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								/**
 								* Get the decomposition mode of the Collator object.
 								* @return the decomposition mode
 								* @see Collator#setDecomposition
 								*/
 								Normalizer::EMode RuleBasedCollator::getDecomposition(void) const
 								{
-												ICU-833 
Because of the new Normalization enum conversion methods, changes have
to be done in tbcoll.

X-SVN-Rev: 3553
											
										
										
											2001-02-03 01:27:02 +00:00
+								  UErrorCode status = U_ZERO_ERROR;
 								  return Normalizer::getNormalizerEMode(ucol_getNormalization(ucollator),
 								                                                              status);
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								}
-												Initial revision

X-SVN-Rev: 2
											
										
										
											1999-08-16 21:50:52 +00:00
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								// RuleBaseCollatorNew private constructor ----------------------------------
-												Initial revision

X-SVN-Rev: 2
											
										
										
											1999-08-16 21:50:52 +00:00
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								RuleBasedCollator::RuleBasedCollator() : dataIsOwned(FALSE)
 								{
 								}
-												Initial revision

X-SVN-Rev: 2
											
										
										
											1999-08-16 21:50:52 +00:00
-												ICU-807 Added comment header

X-SVN-Rev: 3493
											
										
										
											2001-01-30 18:52:58 +00:00
+								RuleBasedCollator::RuleBasedCollator(UCollator *collator,
 								                                     UnicodeString *rule) : dataIsOwned(FALSE)
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								{
 								  ucollator = collator;
-												ICU-807 Added comment header

X-SVN-Rev: 3493
											
										
										
											2001-01-30 18:52:58 +00:00
+								  urulestring = rule;
-												Initial revision

X-SVN-Rev: 2
											
										
										
											1999-08-16 21:50:52 +00:00
+								}
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								RuleBasedCollator::RuleBasedCollator(const Locale& desiredLocale,
 								                                           UErrorCode& status) :
 								                                           dataIsOwned(FALSE)
-												ICU-406 putting collation in resource bundles (initial revision)

X-SVN-Rev: 1426
											
										
										
											2000-05-22 19:49:10 +00:00
+								{
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								  if (U_FAILURE(status))
 								    return;
-												ICU-96 Better memory management in sort key, safe clone implementation

X-SVN-Rev: 3162
											
										
										
											2000-12-07 07:22:55 +00:00
-												ICU-833 
Replaced quickcheck with checkFCD

X-SVN-Rev: 3633
											
										
										
											2001-02-15 19:30:25 +00:00
+								  /*
 								  Try to load, in order:
 . The desired locale's collation.
 . A fallback of the desired locale.
 . The default locale's collation.
 . A fallback of the default locale.
 . The default collation rules, which contains en_US collation rules.
 								   To reiterate, we try:
 								   Specific:
 								    language+country+variant
 								    language+country
 								    language
 								   Default:
 								    language+country+variant
 								    language+country
 								    language
 								   Root: (aka DEFAULTRULES)
 								   steps 1-5 are handled by resource bundle fallback mechanism.
 								   however, in a very unprobable situation that no resource bundle
 								   data exists, step 5 is repeated with hardcoded default rules.
 								  */
-												Initial revision

X-SVN-Rev: 2
											
										
										
											1999-08-16 21:50:52 +00:00
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								  setUCollator(desiredLocale, status);
-												ICU-535 fixed some compiler warnings

X-SVN-Rev: 2181
											
										
										
											2000-08-11 01:27:17 +00:00
-												ICU-807 Added comment header

X-SVN-Rev: 3493
											
										
										
											2001-01-30 18:52:58 +00:00
+								  if (U_FAILURE(status))
-												ICU-96 pathname cleanup

X-SVN-Rev: 286
											
										
										
											1999-12-03 02:51:54 +00:00
+								  {
-												ICU-807 Added comment header

X-SVN-Rev: 3493
											
										
										
											2001-01-30 18:52:58 +00:00
+								    status = U_ZERO_ERROR;
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
-												ICU-807 Added comment header

X-SVN-Rev: 3493
											
										
										
											2001-01-30 18:52:58 +00:00
+								    setUCollator(ResourceBundle::kDefaultFilename, status);
 								    if (U_FAILURE(status))
-												ICU-501 Collation enhancement phase 1.  Added "override" and "version" tag in "CollationElements".

X-SVN-Rev: 1882
											
										
										
											2000-07-14 22:31:35 +00:00
+								    {
-												ICU-807 Added comment header

X-SVN-Rev: 3493
											
										
										
											2001-01-30 18:52:58 +00:00
+								      status = U_ZERO_ERROR;
-												ICU-856 1.8 integration [aix]

X-SVN-Rev: 3635
											
										
										
											2001-02-15 23:43:26 +00:00
+								      uint32_t size = 0;
-												ICU-807 Added comment header

X-SVN-Rev: 3493
											
										
										
											2001-01-30 18:52:58 +00:00
+								      if (status == U_ZERO_ERROR)
 								        status = U_USING_DEFAULT_ERROR;
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								      if (status == U_MEMORY_ALLOCATION_ERROR)
 								        return;
-												Initial revision

X-SVN-Rev: 2
											
										
										
											1999-08-16 21:50:52 +00:00
+								    }
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								  }
-												Initial revision

X-SVN-Rev: 2
											
										
										
											1999-08-16 21:50:52 +00:00
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								  if (U_SUCCESS(status))
-												ICU-807 Added comment header

X-SVN-Rev: 3493
											
										
										
											2001-01-30 18:52:58 +00:00
+								  {
 								    int32_t length;
 								    const UChar *r = ucol_getRules(ucollator, &length);
 								    urulestring = new UnicodeString(r, length);
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								    dataIsOwned = TRUE;
-												ICU-807 Added comment header

X-SVN-Rev: 3493
											
										
										
											2001-01-30 18:52:58 +00:00
+								  }
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
 								  return;
-												Initial revision

X-SVN-Rev: 2
											
										
										
											1999-08-16 21:50:52 +00:00
+								}
-												ICU-833 
Replaced quickcheck with checkFCD

X-SVN-Rev: 3633
											
										
										
											2001-02-15 19:30:25 +00:00
+								/* RuleBasedCollator private data members -------------------------------- */
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
-												ICU-833 
Replaced quickcheck with checkFCD

X-SVN-Rev: 3633
											
										
										
											2001-02-15 19:30:25 +00:00
+								/* need look up in .commit() */
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								const int32_t RuleBasedCollator::CHARINDEX = 0x70000000;
-												ICU-833 
Replaced quickcheck with checkFCD

X-SVN-Rev: 3633
											
										
										
											2001-02-15 19:30:25 +00:00
+								/* Expand index follows */
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								const int32_t RuleBasedCollator::EXPANDCHARINDEX = 0x7E000000;
-												ICU-833 
Replaced quickcheck with checkFCD

X-SVN-Rev: 3633
											
										
										
											2001-02-15 19:30:25 +00:00
+								/* contract indexes follows */
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								const int32_t RuleBasedCollator::CONTRACTCHARINDEX = 0x7F000000;
-												ICU-833 
Replaced quickcheck with checkFCD

X-SVN-Rev: 3633
											
										
										
											2001-02-15 19:30:25 +00:00
+								/* unmapped character values */
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								const int32_t RuleBasedCollator::UNMAPPED = 0xFFFFFFFF;
-												ICU-833 
Replaced quickcheck with checkFCD

X-SVN-Rev: 3633
											
										
										
											2001-02-15 19:30:25 +00:00
+								/* primary strength increment */
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								const int32_t RuleBasedCollator::PRIMARYORDERINCREMENT = 0x00010000;
-												ICU-833 
Replaced quickcheck with checkFCD

X-SVN-Rev: 3633
											
										
										
											2001-02-15 19:30:25 +00:00
+								/* secondary strength increment */
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								const int32_t RuleBasedCollator::SECONDARYORDERINCREMENT = 0x00000100;
-												ICU-833 
Replaced quickcheck with checkFCD

X-SVN-Rev: 3633
											
										
										
											2001-02-15 19:30:25 +00:00
+								/* tertiary strength increment */
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								const int32_t RuleBasedCollator::TERTIARYORDERINCREMENT = 0x00000001;
-												ICU-833 
Replaced quickcheck with checkFCD

X-SVN-Rev: 3633
											
										
										
											2001-02-15 19:30:25 +00:00
+								/* mask off anything but primary order */
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								const int32_t RuleBasedCollator::PRIMARYORDERMASK = 0xffff0000;
-												ICU-833 
Replaced quickcheck with checkFCD

X-SVN-Rev: 3633
											
										
										
											2001-02-15 19:30:25 +00:00
+								/* mask off anything but secondary order */
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								const int32_t RuleBasedCollator::SECONDARYORDERMASK = 0x0000ff00;
-												ICU-833 
Replaced quickcheck with checkFCD

X-SVN-Rev: 3633
											
										
										
											2001-02-15 19:30:25 +00:00
+								/* mask off anything but tertiary order */
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								const int32_t RuleBasedCollator::TERTIARYORDERMASK = 0x000000ff;
-												ICU-833 
Replaced quickcheck with checkFCD

X-SVN-Rev: 3633
											
										
										
											2001-02-15 19:30:25 +00:00
+								/* mask off ignorable char order */
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								const int32_t RuleBasedCollator::IGNORABLEMASK = 0x0000ffff;
-												ICU-833 
Replaced quickcheck with checkFCD

X-SVN-Rev: 3633
											
										
										
											2001-02-15 19:30:25 +00:00
+								/* use only the primary difference */
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								const int32_t RuleBasedCollator::PRIMARYDIFFERENCEONLY = 0xffff0000;
-												ICU-833 
Replaced quickcheck with checkFCD

X-SVN-Rev: 3633
											
										
										
											2001-02-15 19:30:25 +00:00
+								/* use only the primary and secondary difference */
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								const int32_t RuleBasedCollator::SECONDARYDIFFERENCEONLY = 0xffffff00;
-												ICU-833 
Replaced quickcheck with checkFCD

X-SVN-Rev: 3633
											
										
										
											2001-02-15 19:30:25 +00:00
+								/* primary order shift */
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								const int32_t RuleBasedCollator::PRIMARYORDERSHIFT = 16;
-												ICU-833 
Replaced quickcheck with checkFCD

X-SVN-Rev: 3633
											
										
										
											2001-02-15 19:30:25 +00:00
+								/* secondary order shift */
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								const int32_t RuleBasedCollator::SECONDARYORDERSHIFT = 8;
-												ICU-833 
Replaced quickcheck with checkFCD

X-SVN-Rev: 3633
											
										
										
											2001-02-15 19:30:25 +00:00
+								/* starting value for collation elements */
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								const int32_t RuleBasedCollator::COLELEMENTSTART = 0x02020202;
-												ICU-833 
Replaced quickcheck with checkFCD

X-SVN-Rev: 3633
											
										
										
											2001-02-15 19:30:25 +00:00
+								/* testing mask for primary low element */
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								const int32_t RuleBasedCollator::PRIMARYLOWZEROMASK = 0x00FF0000;
-												ICU-833 
Replaced quickcheck with checkFCD

X-SVN-Rev: 3633
											
										
										
											2001-02-15 19:30:25 +00:00
+								/* reseting value for secondaries and tertiaries */
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								const int32_t RuleBasedCollator::RESETSECONDARYTERTIARY = 0x00000202;
-												ICU-833 
Replaced quickcheck with checkFCD

X-SVN-Rev: 3633
											
										
										
											2001-02-15 19:30:25 +00:00
+								/* reseting value for tertiaries */
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								const int32_t RuleBasedCollator::RESETTERTIARY = 0x00000002;
-												Initial revision

X-SVN-Rev: 2
											
										
										
											1999-08-16 21:50:52 +00:00
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								const int32_t RuleBasedCollator::PRIMIGNORABLE = 0x0202;
-												Initial revision

X-SVN-Rev: 2
											
										
										
											1999-08-16 21:50:52 +00:00
-												ICU-833 
Replaced quickcheck with checkFCD

X-SVN-Rev: 3633
											
										
										
											2001-02-15 19:30:25 +00:00
+								/* unique file id for parity check */
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								const int16_t RuleBasedCollator::FILEID = 0x5443;
-												ICU-833 
Replaced quickcheck with checkFCD

X-SVN-Rev: 3633
											
										
										
											2001-02-15 19:30:25 +00:00
+								/* binary collation file extension */
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								const char* RuleBasedCollator::kFilenameSuffix = ".col";
-												ICU-833 
Replaced quickcheck with checkFCD

X-SVN-Rev: 3633
											
										
										
											2001-02-15 19:30:25 +00:00
+								/* class id ? Value is irrelevant */
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								char  RuleBasedCollator::fgClassID = 0;
-												Initial revision

X-SVN-Rev: 2
											
										
										
											1999-08-16 21:50:52 +00:00
-												ICU-833 
Replaced quickcheck with checkFCD

X-SVN-Rev: 3633
											
										
										
											2001-02-15 19:30:25 +00:00
+								/* other methods not belonging to any classes ------------------------------- */
-												ICU-96 new implementation for sortkey generation and compare is active. Expect errors in tests

X-SVN-Rev: 2983
											
										
										
											2000-11-22 00:04:03 +00:00
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								UChar forwardCharIteratorGlue(void *iterator)
-												ICU-96 new implementation for sortkey generation and compare is active. Expect errors in tests

X-SVN-Rev: 2983
											
										
										
											2000-11-22 00:04:03 +00:00
+								{
-												ICU-807 Committed by Syn Wee. New C++ wrappers implementation for C Collation codes ucol.cpp, ucoleitr.cpp.

X-SVN-Rev: 3434
											
										
										
											2001-01-18 00:23:29 +00:00
+								  ForwardCharacterIterator *iter = ((ForwardCharacterIterator *)iterator);
 								  UChar result = iter->nextPostInc();
 								  if (result == ForwardCharacterIterator::DONE)
 								    return 0xFFFF;
 								  else
-												Initial revision

X-SVN-Rev: 2
											
										
										
											1999-08-16 21:50:52 +00:00
+								    return result;
 								}