scuffed-code/icu4c/source/common/unifilt.cpp

/*
**********************************************************************
* Copyright (c) 2001-2004, International Business Machines
* Corporation and others.  All Rights Reserved.
**********************************************************************
*   Date        Name        Description
*   07/18/01    aliu        Creation.
**********************************************************************
*/

#include "unicode/unifilt.h"
#include "unicode/rep.h"

U_NAMESPACE_BEGIN
// Emits the RTTI boilerplate for UnicodeFilter through ICU's UObject
// helper macro.  NOTE(review): the ABSTRACT variant is presumably used
// because UnicodeFilter is not directly instantiable -- confirm against
// the macro's definition in unicode/uobject.h.
UOBJECT_DEFINE_ABSTRACT_RTTI_IMPLEMENTATION(UnicodeFilter)


/* Out-of-line definition of the (empty) UnicodeMatcher destructor.
   It is defined in this file because UnicodeMatcher has no source
   file of its own, and it can't be defined in the header. */
UnicodeMatcher::~UnicodeMatcher() {}

/* Out-of-line UnicodeFilter destructor; it performs no work of its own. */
UnicodeFilter::~UnicodeFilter() {}

/**
 * UnicodeFunctor API.  Exposes this filter through its UnicodeMatcher
 * interface.
 *
 * @return this very object, viewed as a non-const UnicodeMatcher*.
 *         The constness of 'this' is deliberately dropped because the
 *         method is const while the returned pointer is not.
 */
UnicodeMatcher* UnicodeFilter::toMatcher() const {
    UnicodeFilter* mutableSelf = const_cast<UnicodeFilter*>(this);
    return static_cast<UnicodeMatcher*>(mutableSelf);
}

/* Default implementation: the supplied TransliterationRuleData pointer
   is ignored and nothing is done. */
void UnicodeFilter::setData(const TransliterationRuleData*) {}

/**
 * Default implementation of UnicodeMatcher::matches() for Unicode
 * filters.  Tests exactly one code point (one or two 16-bit code
 * units) at 'offset' against contains().
 *
 * The relation between 'offset' and 'limit' selects the direction:
 *  - offset < limit: forward match.  On success 'offset' is advanced
 *    past the matched code point.
 *  - offset > limit: reverse match.  On success 'offset' is moved back
 *    by one code unit, or by two when the code point now in front of
 *    it occupies two code units.
 *  - offset == limit: nothing is left to examine.
 *
 * @param text        the text being matched
 * @param offset      in/out position in 'text'; updated only when
 *                    U_MATCH is returned
 * @param limit       the boundary that 'offset' is compared against
 * @param incremental if TRUE and offset == limit, U_PARTIAL_MATCH is
 *                    returned instead of U_MISMATCH
 * @return U_MATCH, U_PARTIAL_MATCH or U_MISMATCH as described above
 */
UMatchDegree UnicodeFilter::matches(const Replaceable& text,
                                    int32_t& offset,
                                    int32_t limit,
                                    UBool incremental) {
    if (offset < limit) {
        // Forward direction: consume the code point starting at offset.
        const UChar32 current = text.char32At(offset);
        if (contains(current)) {
            offset += UTF_CHAR_LENGTH(current);
            return U_MATCH;
        }
    } else if (offset > limit) {
        // Reverse direction: test the code point at offset, then step
        // back to the start of the code point that precedes it.
        if (contains(text.char32At(offset))) {
            --offset;
            if (offset >= 0) {
                // A two-unit code point needs one extra step so that
                // offset ends up on its lead surrogate.
                const UChar32 previous = text.char32At(offset);
                offset -= UTF_CHAR_LENGTH(previous) - 1;
            }
            return U_MATCH;
        }
    } else if (incremental) {
        // offset == limit: more text could still produce a match.
        return U_PARTIAL_MATCH;
    }
    return U_MISMATCH;
}

U_NAMESPACE_END

//eof
ICU-1052 redesign of engine to support supplemental characters X-SVN-Rev: 5340 2001-07-25 18:50:09 +00:00			`/*`
ICU-3221 Fix the AIX linker warning about multiple definitions of virtual functions. X-SVN-Rev: 12958 2003-08-27 01:01:42 +00:00			`**********************************************************************`
ICU-4179 update copyright notices for ICU 3.2 X-SVN-Rev: 16681 2004-10-29 22:50:01 +00:00			`* Copyright (c) 2001-2004, International Business Machines`
ICU-3221 Fix the AIX linker warning about multiple definitions of virtual functions. X-SVN-Rev: 12958 2003-08-27 01:01:42 +00:00			`* Corporation and others. All Rights Reserved.`
ICU-1052 redesign of engine to support supplemental characters X-SVN-Rev: 5340 2001-07-25 18:50:09 +00:00			`**********************************************************************`
			`* Date Name Description`
			`* 07/18/01 aliu Creation.`
			`**********************************************************************`
			`*/`

			`#include "unicode/unifilt.h"`
			`#include "unicode/rep.h"`

ICU-1264 added namspace support where possible. X-SVN-Rev: 6124 2001-10-08 23:26:58 +00:00			`U_NAMESPACE_BEGIN`
ICU-3783 Make getDynamicClassID() pure virutal on abstract classes. X-SVN-Rev: 15705 2004-06-04 01:16:05 +00:00			`UOBJECT_DEFINE_ABSTRACT_RTTI_IMPLEMENTATION(UnicodeFilter)`
ICU-3783 restore getStaticClassID() to several classes from which it had been removed in error. X-SVN-Rev: 15619 2004-05-28 20:13:11 +00:00
ICU-1264 added namspace support where possible. X-SVN-Rev: 6124 2001-10-08 23:26:58 +00:00
ICU-3221 Fix the AIX linker warning about multiple definitions of virtual functions. X-SVN-Rev: 12958 2003-08-27 01:01:42 +00:00			`/* Define this here due to the lack of another file.`
			`It can't be defined in the header */`
			`UnicodeMatcher::~UnicodeMatcher() {}`

			`UnicodeFilter::~UnicodeFilter() {}`
ICU-1962 change UObject: RTTI pure virtual, remove other boilerplate for now X-SVN-Rev: 8977 2002-06-29 00:04:16 +00:00
ICU-1234 make output side of RBTs object-oriented; rewrite ID parsers and modularize them; implement &Any-Lower() support X-SVN-Rev: 7582 2002-02-07 01:07:55 +00:00			`/**`
			`* UnicodeFunctor API. Cast 'this' to a UnicodeMatcher* pointer`
			`* and return the pointer.`
			`*/`
			`UnicodeMatcher* UnicodeFilter::toMatcher() const {`
			`return (UnicodeMatcher*) this;`
			`}`

ICU-3221 Fix the AIX linker warning about multiple definitions of virtual functions. X-SVN-Rev: 12958 2003-08-27 01:01:42 +00:00			`void UnicodeFilter::setData(const TransliterationRuleData*) {}`

ICU-1052 redesign of engine to support supplemental characters X-SVN-Rev: 5340 2001-07-25 18:50:09 +00:00			`/**`
			`* Default implementation of UnicodeMatcher::matches() for Unicode`
ICU-1533 update docs per Doug's review X-SVN-Rev: 7005 2001-11-20 00:41:01 +00:00			`* filters. Matches a single code point at offset (either one or`
			`* two 16-bit code units).`
ICU-1052 redesign of engine to support supplemental characters X-SVN-Rev: 5340 2001-07-25 18:50:09 +00:00			`*/`
			`UMatchDegree UnicodeFilter::matches(const Replaceable& text,`
			`int32_t& offset,`
			`int32_t limit,`
ICU-1406 make UnicodeMatcher::matches non-const X-SVN-Rev: 6503 2001-10-30 23:55:09 +00:00			`UBool incremental) {`
ICU-1052 redesign of engine to support supplemental characters X-SVN-Rev: 5340 2001-07-25 18:50:09 +00:00			`UChar32 c;`
			`if (offset < limit &&`
			`contains(c = text.char32At(offset))) {`
			`offset += UTF_CHAR_LENGTH(c);`
			`return U_MATCH;`
			`}`
			`if (offset > limit &&`
ICU-1052 fix handling of surrogates in antecontext and cursor positioning X-SVN-Rev: 5346 2001-07-25 21:15:53 +00:00			`contains(c = text.char32At(offset))) {`
			`// Backup offset by 1, unless the preceding character is a`
			`// surrogate pair -- then backup by 2 (keep offset pointing at`
			`// the lead surrogate).`
			`--offset;`
			`if (offset >= 0) {`
			`offset -= UTF_CHAR_LENGTH(text.char32At(offset)) - 1;`
			`}`
ICU-1052 redesign of engine to support supplemental characters X-SVN-Rev: 5340 2001-07-25 18:50:09 +00:00			`return U_MATCH;`
			`}`
			`if (incremental && offset == limit) {`
			`return U_PARTIAL_MATCH;`
			`}`
			`return U_MISMATCH;`
			`}`
ICU-1076 initial limited support for Kleene star and plus operators X-SVN-Rev: 5359 2001-07-27 00:18:53 +00:00
ICU-1264 added namspace support where possible. X-SVN-Rev: 6124 2001-10-08 23:26:58 +00:00			`U_NAMESPACE_END`

ICU-1076 initial limited support for Kleene star and plus operators X-SVN-Rev: 5359 2001-07-27 00:18:53 +00:00			`//eof`