scuffed-code/icu4c/source/i18n/brkiter.cpp

/*
*******************************************************************************
* Copyright (C) 1997-2001, International Business Machines Corporation and    *
* others. All Rights Reserved.                                                *
*******************************************************************************
*
* File TXTBDRY.CPP
*
* Modification History:
*
*   Date        Name        Description
*   02/18/97    aliu        Converted from OpenClass.  Added DONE.
*   01/13/2000  helena      Added UErrorCode parameter to createXXXInstance methods.
*****************************************************************************************
*/

// *****************************************************************************
// This file was generated from the java source file BreakIterator.java
// *****************************************************************************

#include "unicode/dbbi.h"
#include "unicode/brkiter.h"
#include "unicode/udata.h"
#include "unicode/resbund.h"
#include "cstring.h"
#include <string.h>

// *****************************************************************************
// class BreakIterator
// This class implements methods for finding the location of boundaries in text. 
// Instances of BreakIterator maintain a current position and scan over text
// returning the index of characters where boundaries occur.
// *****************************************************************************

// Definition of the class constant DONE; its value is -1.
// NOTE(review): presumably the sentinel the iteration methods return when no
// further boundary exists -- confirm against the declaration in brkiter.h.
const UTextOffset BreakIterator::DONE = static_cast<int32_t>(-1);

// -------------------------------------

// Creates a break iterator for word boundaries.
//
// key    - locale whose language selects the rules data.  Only "th" (Thai) is
//          special-cased; every other language uses the default "word" rules.
// status - in/out error code.  If it already indicates failure on entry,
//          nothing is opened and NULL is returned.  Otherwise it receives
//          whatever udata_open() and the iterator constructor report, or
//          U_MEMORY_ALLOCATION_ERROR if the iterator could not be allocated.
//
// Returns the newly allocated iterator, or NULL when the rules data could not
// be opened or the allocation failed.  The iterator is returned as-is even if
// the dictionary-based constructor reported a failure through status, so
// callers must check status as well as the pointer.
BreakIterator*
BreakIterator::createWordInstance(const Locale& key, UErrorCode& status)
{
    // WARNING: This routine is currently written specifically to handle only the
    // default rules files and the alternate rules files for Thai.  This function
    // will have to be made fully general at some time in the future!
    if (U_FAILURE(status)) {
        return NULL;
    }

    // Decide once whether the Thai alternates apply and reuse the answer below.
    const UBool isThai = (uprv_strcmp(key.getLanguage(), "th") == 0);
    const char* filename = isThai ? "word_th" : "word";

    UDataMemory* file = udata_open(NULL, "brk", filename, &status);
    if (U_FAILURE(status)) {
        return NULL;
    }

    // NOTE(review): the iterator presumably takes ownership of `file` once it
    // has been constructed -- confirm against the iterator classes.
    BreakIterator* result = NULL;
    if (isThai) {
        // Thai additionally needs the word dictionary.
        result = new DictionaryBasedBreakIterator(file, (char *)"thaidict.brk", status);
    }
    else {
        result = new RuleBasedBreakIterator(file);
    }

    if (result == NULL) {
        // No constructor ran, so nothing else can have taken over the data
        // handle: release it here and report the failure instead of silently
        // returning NULL with a successful status.
        udata_close(file);
        status = U_MEMORY_ALLOCATION_ERROR;
    }

    return result;
}

// -------------------------------------

// Creates a break iterator for line boundaries.
//
// key    - locale whose language selects the rules data.  Only "th" (Thai) is
//          special-cased; every other language uses the default "line" rules.
// status - in/out error code.  If it already indicates failure on entry,
//          nothing is opened and NULL is returned.  Otherwise it receives
//          whatever udata_open() and the iterator constructor report, or
//          U_MEMORY_ALLOCATION_ERROR if the iterator could not be allocated.
//
// Returns the newly allocated iterator, or NULL when the rules data could not
// be opened or the allocation failed.  The iterator is returned as-is even if
// the dictionary-based constructor reported a failure through status, so
// callers must check status as well as the pointer.
BreakIterator*
BreakIterator::createLineInstance(const Locale& key, UErrorCode& status)
{
    // WARNING: This routine is currently written specifically to handle only the
    // default rules files and the alternate rules files for Thai.  This function
    // will have to be made fully general at some time in the future!
    if (U_FAILURE(status)) {
        return NULL;
    }

    // Decide once whether the Thai alternates apply and reuse the answer below.
    const UBool isThai = (uprv_strcmp(key.getLanguage(), "th") == 0);
    const char* filename = isThai ? "line_th" : "line";

    UDataMemory* file = udata_open(NULL, "brk", filename, &status);
    if (U_FAILURE(status)) {
        return NULL;
    }

    // NOTE(review): the iterator presumably takes ownership of `file` once it
    // has been constructed -- confirm against the iterator classes.
    BreakIterator* result = NULL;
    if (isThai) {
        // Thai additionally needs the word dictionary.
        result = new DictionaryBasedBreakIterator(file, (char *)"thaidict.brk", status);
    }
    else {
        result = new RuleBasedBreakIterator(file);
    }

    if (result == NULL) {
        // No constructor ran, so nothing else can have taken over the data
        // handle: release it here and report the failure instead of silently
        // returning NULL with a successful status.
        udata_close(file);
        status = U_MEMORY_ALLOCATION_ERROR;
    }

    return result;
}

// -------------------------------------

// Creates a break iterator for character boundaries.
//
// key    - currently ignored: the default "char" rules are used for every
//          locale.
// status - in/out error code.  If it already indicates failure on entry,
//          nothing is opened and NULL is returned.  Otherwise it receives
//          whatever udata_open() reports, or U_MEMORY_ALLOCATION_ERROR if the
//          iterator could not be allocated.
//
// Returns the newly allocated iterator, or NULL when the rules data could not
// be opened or the allocation failed.
BreakIterator*
BreakIterator::createCharacterInstance(const Locale& key, UErrorCode& status)
{
    // WARNING: This routine only knows about the default rules file.  It will
    // have to be made locale-aware at some time in the future!
    if (U_FAILURE(status)) {
        return NULL;
    }

    UDataMemory* file = udata_open(NULL, "brk", "char", &status);
    if (U_FAILURE(status)) {
        return NULL;
    }

    // NOTE(review): the iterator presumably takes ownership of `file` once it
    // has been constructed -- confirm against RuleBasedBreakIterator.
    BreakIterator* result = new RuleBasedBreakIterator(file);
    if (result == NULL) {
        // No constructor ran, so nothing else can have taken over the data
        // handle: release it here and report the failure instead of silently
        // returning NULL with a successful status.
        udata_close(file);
        status = U_MEMORY_ALLOCATION_ERROR;
    }

    return result;
}

// -------------------------------------

// Creates a break iterator for sentence boundaries.
//
// key    - currently ignored: the default "sent" rules are used for every
//          locale.
// status - in/out error code.  If it already indicates failure on entry,
//          nothing is opened and NULL is returned.  Otherwise it receives
//          whatever udata_open() reports, or U_MEMORY_ALLOCATION_ERROR if the
//          iterator could not be allocated.
//
// Returns the newly allocated iterator, or NULL when the rules data could not
// be opened or the allocation failed.
BreakIterator*
BreakIterator::createSentenceInstance(const Locale& key, UErrorCode& status)
{
    // WARNING: This routine only knows about the default rules file.  It will
    // have to be made locale-aware at some time in the future!
    if (U_FAILURE(status)) {
        return NULL;
    }

    UDataMemory* file = udata_open(NULL, "brk", "sent", &status);
    if (U_FAILURE(status)) {
        return NULL;
    }

    // NOTE(review): the iterator presumably takes ownership of `file` once it
    // has been constructed -- confirm against RuleBasedBreakIterator.
    BreakIterator* result = new RuleBasedBreakIterator(file);
    if (result == NULL) {
        // No constructor ran, so nothing else can have taken over the data
        // handle: release it here and report the failure instead of silently
        // returning NULL with a successful status.
        udata_close(file);
        status = U_MEMORY_ALLOCATION_ERROR;
    }

    return result;
}

// -------------------------------------

// Gets the available locales.  This simply forwards to
// Locale::getAvailableLocales(), handing `count` through by reference, and
// returns whatever array that call yields.
const Locale*
BreakIterator::getAvailableLocales(int32_t& count)
{
    const Locale* const locales = Locale::getAvailableLocales(count);
    return locales;
}

// -------------------------------------
// Gets the display name of objectLocale by forwarding to
// Locale::getDisplayName(name).  No display locale is passed, so the choice of
// language is left to that overload.  Returns the reference it hands back.
UnicodeString&
BreakIterator::getDisplayName(const Locale& objectLocale,
                             UnicodeString& name)
{
    UnicodeString& displayName = objectLocale.getDisplayName(name);
    return displayName;
}

// -------------------------------------
// Gets the display name of objectLocale, localized for displayLocale, by
// forwarding to Locale::getDisplayName(displayLocale, name).  Returns the
// reference that call hands back.
UnicodeString&
BreakIterator::getDisplayName(const Locale& objectLocale,
                             const Locale& displayLocale,
                             UnicodeString& name)
{
    UnicodeString& displayName = objectLocale.getDisplayName(displayLocale, name);
    return displayName;
}

// -------------------------------------

// Default constructor.  It has to be written out by hand: the class declares
// its copy constructor (to keep one from being synthesized), and once any
// constructor is declared the compiler no longer supplies a default one.
// A freshly constructed iterator starts with fBufferClone cleared.

BreakIterator::BreakIterator()
    : fBufferClone(FALSE)
{
}

// Destructor.  The body is intentionally empty: it performs no cleanup itself.
BreakIterator::~BreakIterator() {}

//eof
Initial revision X-SVN-Rev: 2 1999-08-16 21:50:52 +00:00			`/*`
ICU-161 changed copyright notice X-SVN-Rev: 220 1999-11-22 20:25:35 +00:00			`*******************************************************************************`
ICU-903 updated copyright notices X-SVN-Rev: 4237 2001-03-21 20:31:13 +00:00			`* Copyright (C) 1997-2001, International Business Machines Corporation and *`
ICU-161 changed copyright notice X-SVN-Rev: 220 1999-11-22 20:25:35 +00:00			`* others. All Rights Reserved. *`
			`*******************************************************************************`
Initial revision X-SVN-Rev: 2 1999-08-16 21:50:52 +00:00			`*`
			`* File TXTBDRY.CPP`
			`*`
			`* Modification History:`
			`*`
			`* Date Name Description`
			`* 02/18/97 aliu Converted from OpenClass. Added DONE.`
ICU-45 Added ErrorCode to the constructor APIs. . X-SVN-Rev: 578 2000-01-14 00:13:59 +00:00			`* 01/13/2000 helena Added UErrorCode parameter to createXXXInstance methods.`
Initial revision X-SVN-Rev: 2 1999-08-16 21:50:52 +00:00			`*****************************************************************************************`
			`*/`

			`// *****************************************************************************`
			`// This file was generated from the java source file BreakIterator.java`
			`// *****************************************************************************`

ICU-45 Fixed the include path problems. X-SVN-Rev: 507 2000-01-10 21:21:52 +00:00			`#include "unicode/dbbi.h"`
ICU-12 all public include files are now in unicode dir, all private icu_ functions renamed to uprv_ X-SVN-Rev: 473 1999-12-28 23:57:50 +00:00			`#include "unicode/brkiter.h"`
ICU-45 Initial check-in of RuleBasedBreakIterator and DictionaryBasedBreakIterator. X-SVN-Rev: 502 2000-01-08 02:05:05 +00:00			`#include "unicode/udata.h"`
ICU-45 Fixed the include path problems. X-SVN-Rev: 507 2000-01-10 21:21:52 +00:00			`#include "unicode/resbund.h"`
ICU-185 don't call Locale(UnicodeString..) deprecated apis X-SVN-Rev: 1135 2000-04-15 21:23:28 +00:00			`#include "cstring.h"`
Initial revision X-SVN-Rev: 2 1999-08-16 21:50:52 +00:00			`#include <string.h>`

			`// *****************************************************************************`
			`// class BreakIterator`
			`// This class implements methods for finding the location of boundaries in text.`
			`// Instances of BreakIterator maintain a current position and scan over text`
			`// returning the index of characters where boundaries occur.`
			`// *****************************************************************************`

			`const UTextOffset BreakIterator::DONE = (int32_t)-1;`

			`// -------------------------------------`

			`// Creates a simple text boundary for word breaks.`
			`BreakIterator*`
ICU-45 Added ErrorCode to the constructor APIs. . X-SVN-Rev: 578 2000-01-14 00:13:59 +00:00			`BreakIterator::createWordInstance(const Locale& key, UErrorCode& status)`
Initial revision X-SVN-Rev: 2 1999-08-16 21:50:52 +00:00			`{`
ICU-45 Initial check-in of RuleBasedBreakIterator and DictionaryBasedBreakIterator. X-SVN-Rev: 502 2000-01-08 02:05:05 +00:00			`// WARNING: This routine is currently written specifically to handle only the`
			`// default rules files and the alternate rules files for Thai. This function`
			`// will have to be made fully general at some time in the future!`
			`BreakIterator* result = NULL;`
			`const char* filename = "word";`

			`UnicodeString temp;`
ICU-45 Added ErrorCode to the constructor APIs. . X-SVN-Rev: 578 2000-01-14 00:13:59 +00:00			`if (U_FAILURE(status)) return NULL;`
ICU-185 don't call Locale(UnicodeString..) deprecated apis X-SVN-Rev: 1135 2000-04-15 21:23:28 +00:00			`if (!uprv_strcmp(key.getLanguage(), "th"))`
			`{`
ICU-45 Initial check-in of RuleBasedBreakIterator and DictionaryBasedBreakIterator. X-SVN-Rev: 502 2000-01-08 02:05:05 +00:00			`filename = "word_th";`
			`}`

ICU-45 Added ErrorCode to the constructor APIs. . X-SVN-Rev: 578 2000-01-14 00:13:59 +00:00			`UDataMemory* file = udata_open(NULL, "brk", filename, &status);`
ICU-45 Initial check-in of RuleBasedBreakIterator and DictionaryBasedBreakIterator. X-SVN-Rev: 502 2000-01-08 02:05:05 +00:00
ICU-45 Added ErrorCode to the constructor APIs. . X-SVN-Rev: 578 2000-01-14 00:13:59 +00:00			`if (!U_FAILURE(status)) {`
ICU-45 Initial check-in of RuleBasedBreakIterator and DictionaryBasedBreakIterator. X-SVN-Rev: 502 2000-01-08 02:05:05 +00:00
ICU-185 don't call Locale(UnicodeString..) deprecated apis X-SVN-Rev: 1135 2000-04-15 21:23:28 +00:00			`if(!uprv_strcmp(filename, "word_th")) {`
ICU-45 Initial check-in of RuleBasedBreakIterator and DictionaryBasedBreakIterator. X-SVN-Rev: 502 2000-01-08 02:05:05 +00:00			`filename = "thaidict.brk";`
ICU-489 breakiterator now uses binary type in resb for thai X-SVN-Rev: 1772 2000-07-10 20:16:27 +00:00
ICU-458 breakiterator & co should now close opened udata instances X-SVN-Rev: 1801 2000-07-12 05:01:53 +00:00			`result = new DictionaryBasedBreakIterator(file, (char *)filename, status);`
ICU-45 Initial check-in of RuleBasedBreakIterator and DictionaryBasedBreakIterator. X-SVN-Rev: 502 2000-01-08 02:05:05 +00:00			`}`
			`else {`
ICU-458 breakiterator & co should now close opened udata instances X-SVN-Rev: 1801 2000-07-12 05:01:53 +00:00			`result = new RuleBasedBreakIterator(file);`
ICU-45 Initial check-in of RuleBasedBreakIterator and DictionaryBasedBreakIterator. X-SVN-Rev: 502 2000-01-08 02:05:05 +00:00			`}`
			`}`

			`return result;`
Initial revision X-SVN-Rev: 2 1999-08-16 21:50:52 +00:00			`}`

			`// -------------------------------------`

			`// Creates a simple text boundary for line breaks.`
			`BreakIterator*`
ICU-45 Added ErrorCode to the constructor APIs. . X-SVN-Rev: 578 2000-01-14 00:13:59 +00:00			`BreakIterator::createLineInstance(const Locale& key, UErrorCode& status)`
Initial revision X-SVN-Rev: 2 1999-08-16 21:50:52 +00:00			`{`
ICU-45 Initial check-in of RuleBasedBreakIterator and DictionaryBasedBreakIterator. X-SVN-Rev: 502 2000-01-08 02:05:05 +00:00			`// WARNING: This routine is currently written specifically to handle only the`
			`// default rules files and the alternate rules files for Thai. This function`
			`// will have to be made fully general at some time in the future!`
			`BreakIterator* result = NULL;`
			`const char* filename = "line";`

			`UnicodeString temp;`
ICU-45 Added ErrorCode to the constructor APIs. . X-SVN-Rev: 578 2000-01-14 00:13:59 +00:00			`if (U_FAILURE(status)) return NULL;`
ICU-185 don't call Locale(UnicodeString..) deprecated apis X-SVN-Rev: 1135 2000-04-15 21:23:28 +00:00			`if (!uprv_strcmp(key.getLanguage(), "th"))`
			`{`
ICU-45 Initial check-in of RuleBasedBreakIterator and DictionaryBasedBreakIterator. X-SVN-Rev: 502 2000-01-08 02:05:05 +00:00			`filename = "line_th";`
			`}`

ICU-45 Added ErrorCode to the constructor APIs. . X-SVN-Rev: 578 2000-01-14 00:13:59 +00:00			`UDataMemory* file = udata_open(NULL, "brk", filename, &status);`
ICU-45 Initial check-in of RuleBasedBreakIterator and DictionaryBasedBreakIterator. X-SVN-Rev: 502 2000-01-08 02:05:05 +00:00
ICU-45 Added ErrorCode to the constructor APIs. . X-SVN-Rev: 578 2000-01-14 00:13:59 +00:00			`if (!U_FAILURE(status)) {`
ICU-45 Initial check-in of RuleBasedBreakIterator and DictionaryBasedBreakIterator. X-SVN-Rev: 502 2000-01-08 02:05:05 +00:00
ICU-185 don't call Locale(UnicodeString..) deprecated apis X-SVN-Rev: 1135 2000-04-15 21:23:28 +00:00			`if (!uprv_strcmp(key.getLanguage(), "th")) {`
ICU-45 Initial check-in of RuleBasedBreakIterator and DictionaryBasedBreakIterator. X-SVN-Rev: 502 2000-01-08 02:05:05 +00:00			`const char* dataDir = u_getDataDirectory();`
			`filename = "thaidict.brk";`
ICU-458 breakiterator & co should now close opened udata instances X-SVN-Rev: 1801 2000-07-12 05:01:53 +00:00			`result = new DictionaryBasedBreakIterator(file, (char *)filename, status);`
ICU-45 Initial check-in of RuleBasedBreakIterator and DictionaryBasedBreakIterator. X-SVN-Rev: 502 2000-01-08 02:05:05 +00:00			`}`
			`else {`
ICU-458 breakiterator & co should now close opened udata instances X-SVN-Rev: 1801 2000-07-12 05:01:53 +00:00			`result = new RuleBasedBreakIterator(file);`
ICU-45 Initial check-in of RuleBasedBreakIterator and DictionaryBasedBreakIterator. X-SVN-Rev: 502 2000-01-08 02:05:05 +00:00			`}`
			`}`

ICU-432 fixing leaks X-SVN-Rev: 1649 2000-06-26 22:46:15 +00:00
ICU-45 Initial check-in of RuleBasedBreakIterator and DictionaryBasedBreakIterator. X-SVN-Rev: 502 2000-01-08 02:05:05 +00:00			`return result;`
Initial revision X-SVN-Rev: 2 1999-08-16 21:50:52 +00:00			`}`

			`// -------------------------------------`

			`// Creates a simple text boundary for character breaks.`
			`BreakIterator*`
ICU-45 Added ErrorCode to the constructor APIs. . X-SVN-Rev: 578 2000-01-14 00:13:59 +00:00			`BreakIterator::createCharacterInstance(const Locale& key, UErrorCode& status)`
Initial revision X-SVN-Rev: 2 1999-08-16 21:50:52 +00:00			`{`
ICU-45 Initial check-in of RuleBasedBreakIterator and DictionaryBasedBreakIterator. X-SVN-Rev: 502 2000-01-08 02:05:05 +00:00			`// WARNING: This routine is currently written specifically to handle only the`
			`// default rules files and the alternate rules files for Thai. This function`
			`// will have to be made fully general at some time in the future!`
			`BreakIterator* result = NULL;`
			`const char* filename = "char";`

ICU-45 Added ErrorCode to the constructor APIs. . X-SVN-Rev: 578 2000-01-14 00:13:59 +00:00			`if (U_FAILURE(status)) return NULL;`
			`UDataMemory* file = udata_open(NULL, "brk", filename, &status);`
ICU-45 Initial check-in of RuleBasedBreakIterator and DictionaryBasedBreakIterator. X-SVN-Rev: 502 2000-01-08 02:05:05 +00:00
ICU-45 Added ErrorCode to the constructor APIs. . X-SVN-Rev: 578 2000-01-14 00:13:59 +00:00			`if (!U_FAILURE(status)) {`
ICU-458 breakiterator & co should now close opened udata instances X-SVN-Rev: 1801 2000-07-12 05:01:53 +00:00			`result = new RuleBasedBreakIterator(file);`
ICU-45 Initial check-in of RuleBasedBreakIterator and DictionaryBasedBreakIterator. X-SVN-Rev: 502 2000-01-08 02:05:05 +00:00			`}`

ICU-432 fixing leaks X-SVN-Rev: 1649 2000-06-26 22:46:15 +00:00
ICU-45 Initial check-in of RuleBasedBreakIterator and DictionaryBasedBreakIterator. X-SVN-Rev: 502 2000-01-08 02:05:05 +00:00			`return result;`
Initial revision X-SVN-Rev: 2 1999-08-16 21:50:52 +00:00			`}`

			`// -------------------------------------`

			`// Creates a simple text boundary for sentence breaks.`
			`BreakIterator*`
ICU-45 Added ErrorCode to the constructor APIs. . X-SVN-Rev: 578 2000-01-14 00:13:59 +00:00			`BreakIterator::createSentenceInstance(const Locale& key, UErrorCode& status)`
Initial revision X-SVN-Rev: 2 1999-08-16 21:50:52 +00:00			`{`
ICU-45 Initial check-in of RuleBasedBreakIterator and DictionaryBasedBreakIterator. X-SVN-Rev: 502 2000-01-08 02:05:05 +00:00			`// WARNING: This routine is currently written specifically to handle only the`
			`// default rules files and the alternate rules files for Thai. This function`
			`// will have to be made fully general at some time in the future!`
			`BreakIterator* result = NULL;`
			`const char* filename = "sent";`

ICU-45 Added ErrorCode to the constructor APIs. . X-SVN-Rev: 578 2000-01-14 00:13:59 +00:00			`if (U_FAILURE(status)) return NULL;`
			`UDataMemory* file = udata_open(NULL, "brk", filename, &status);`
ICU-45 Initial check-in of RuleBasedBreakIterator and DictionaryBasedBreakIterator. X-SVN-Rev: 502 2000-01-08 02:05:05 +00:00
ICU-45 Added ErrorCode to the constructor APIs. . X-SVN-Rev: 578 2000-01-14 00:13:59 +00:00			`if (!U_FAILURE(status)) {`
ICU-458 breakiterator & co should now close opened udata instances X-SVN-Rev: 1801 2000-07-12 05:01:53 +00:00			`result = new RuleBasedBreakIterator(file);`
ICU-45 Initial check-in of RuleBasedBreakIterator and DictionaryBasedBreakIterator. X-SVN-Rev: 502 2000-01-08 02:05:05 +00:00			`}`

			`return result;`
Initial revision X-SVN-Rev: 2 1999-08-16 21:50:52 +00:00			`}`

			`// -------------------------------------`

			`// Gets all the available locales that has localized text boundary data.`
			`const Locale*`
			`BreakIterator::getAvailableLocales(int32_t& count)`
			`{`
			`return Locale::getAvailableLocales(count);`
			`}`

			`// -------------------------------------`
			`// Gets the objectLocale display name in the default locale language.`
			`UnicodeString&`
			`BreakIterator::getDisplayName(const Locale& objectLocale,`
			`UnicodeString& name)`
			`{`
			`return objectLocale.getDisplayName(name);`
			`}`

			`// -------------------------------------`
			`// Gets the objectLocale display name in the displayLocale language.`
			`UnicodeString&`
			`BreakIterator::getDisplayName(const Locale& objectLocale,`
			`const Locale& displayLocale,`
			`UnicodeString& name)`
			`{`
			`return objectLocale.getDisplayName(displayLocale, name);`
			`}`

			`// -------------------------------------`

			`// Needed because we declare the copy constructor (in order to prevent synthesizing one) and`
			`// so the default constructor is no longer synthesized.`

			`BreakIterator::BreakIterator()`
			`{`
ICU-853 Implementations for ubrk_safeClone, including C++ API changes needed (createBufferClone & isBufferClone in BreakIterator classes) X-SVN-Rev: 3713 2001-02-21 23:40:41 +00:00			`fBufferClone = FALSE;`
Initial revision X-SVN-Rev: 2 1999-08-16 21:50:52 +00:00			`}`

			`BreakIterator::~BreakIterator()`
			`{`
			`}`

			`//eof`