2003-05-29 22:10:20 +00:00
|
|
|
/********************************************************************
 * COPYRIGHT:
 * Copyright (c) 1999-2003, International Business Machines Corporation and
 * others. All Rights Reserved.
 ********************************************************************/
|
|
|
|
|
|
|
|
#include "unaccent.h"
|
|
|
|
|
|
|
|
// Out-of-class definition of the static member fgClassID, initialized to 0.
// NOTE(review): presumably only the address of this byte matters (ICU-style
// class ID used for run-time type identification) - confirm against unaccent.h.
const char UnaccentTransliterator::fgClassID = 0;
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Constructor
|
|
|
|
*/
|
|
|
|
UnaccentTransliterator::UnaccentTransliterator() :
|
|
|
|
normalizer("", UNORM_NFD),
|
|
|
|
Transliterator("Unaccent", 0) {
|
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Destructor
|
|
|
|
*/
|
|
|
|
UnaccentTransliterator::~UnaccentTransliterator() {
|
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Remove accents from a character using Normalizer.
|
|
|
|
*/
|
|
|
|
UChar UnaccentTransliterator::unaccent(UChar c) const {
|
|
|
|
UnicodeString str(c);
|
|
|
|
UErrorCode status = U_ZERO_ERROR;
|
|
|
|
UnaccentTransliterator* t = (UnaccentTransliterator*)this;
|
|
|
|
|
|
|
|
t->normalizer.setText(str, status);
|
|
|
|
if (U_FAILURE(status)) {
|
|
|
|
return c;
|
|
|
|
}
|
|
|
|
return (UChar) t->normalizer.next();
|
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Implement Transliterator API
|
|
|
|
*/
|
|
|
|
void UnaccentTransliterator::handleTransliterate(Replaceable& text,
|
|
|
|
UTransPosition& index,
|
|
|
|
UBool incremental) const {
|
|
|
|
UnicodeString str("a");
|
|
|
|
while (index.start < index.limit) {
|
|
|
|
UChar c = text.charAt(index.start);
|
|
|
|
UChar d = unaccent(c);
|
|
|
|
if (c != d) {
|
|
|
|
str.setCharAt(0, d);
|
|
|
|
text.handleReplaceBetween(index.start, index.start+1, str);
|
|
|
|
}
|
|
|
|
index.start++;
|
|
|
|
}
|
|
|
|
}
|