2002-06-07 20:24:40 +00:00
|
|
|
/*
|
|
|
|
*****************************************************************
|
|
|
|
* Copyright (c) 2002, International Business Machines Corporation
|
|
|
|
* and others. All Rights Reserved.
|
|
|
|
*****************************************************************
|
|
|
|
* $Source: /xsrl/Nsvn/icu/icu/source/i18n/anytrans.h,v $
|
2002-09-20 01:54:48 +00:00
|
|
|
* $Revision: 1.4 $
|
2002-06-07 20:24:40 +00:00
|
|
|
*****************************************************************
|
|
|
|
* Date Name Description
|
|
|
|
* 06/06/2002 aliu Creation.
|
|
|
|
*****************************************************************
|
|
|
|
*/
|
|
|
|
#ifndef _ANYTRANS_H_
|
|
|
|
#define _ANYTRANS_H_
|
|
|
|
|
2002-09-20 01:54:48 +00:00
|
|
|
#include "unicode/utypes.h"
|
|
|
|
|
|
|
|
#if !UCONFIG_NO_TRANSLITERATION
|
|
|
|
|
2002-06-07 20:24:40 +00:00
|
|
|
#include "unicode/translit.h"
|
|
|
|
#include "unicode/uscript.h"
|
2002-06-11 22:36:11 +00:00
|
|
|
#include "uhash.h"
|
2002-06-07 20:24:40 +00:00
|
|
|
|
|
|
|
U_NAMESPACE_BEGIN
|
|
|
|
|
|
|
|
/**
|
2002-06-11 22:36:11 +00:00
|
|
|
* A transliterator named Any-T or Any-T/V, where T is the target
|
|
|
|
* script and V is the optional variant, that uses multiple
|
|
|
|
* transliterators, all going to T or T/V, all with script sources.
|
|
|
|
* The target must be a script. It partitions text into runs of the
|
|
|
|
* same script, and then based on the script of each run,
|
|
|
|
* transliterates from that script to the given target or
|
|
|
|
* target/variant. Adjacent COMMON or INHERITED script characters are
|
|
|
|
* included in each run.
|
2002-06-07 20:24:40 +00:00
|
|
|
*
|
|
|
|
* @author Alan Liu
|
|
|
|
*/
|
|
|
|
class U_I18N_API AnyTransliterator : public Transliterator {
|
|
|
|
|
|
|
|
/**
|
2002-06-11 22:36:11 +00:00
|
|
|
* Cache mapping UScriptCode values to Transliterator*.
|
2002-06-07 20:24:40 +00:00
|
|
|
*/
|
2002-06-11 22:36:11 +00:00
|
|
|
UHashtable* cache;
|
2002-06-07 20:24:40 +00:00
|
|
|
|
|
|
|
/**
|
2002-06-11 22:36:11 +00:00
|
|
|
* The target or target/variant string.
|
2002-06-07 20:24:40 +00:00
|
|
|
*/
|
2002-06-11 22:36:11 +00:00
|
|
|
UnicodeString target;
|
2002-06-07 20:24:40 +00:00
|
|
|
|
|
|
|
/**
|
2002-06-11 22:36:11 +00:00
|
|
|
* The target script code. Never USCRIPT_INVALID_CODE.
|
2002-06-07 20:24:40 +00:00
|
|
|
*/
|
2002-06-11 22:36:11 +00:00
|
|
|
UScriptCode targetScript;
|
2002-06-07 20:24:40 +00:00
|
|
|
|
2002-06-29 00:04:16 +00:00
|
|
|
/**
|
|
|
|
* The address of this static class variable serves as this class's ID
|
|
|
|
* for ICU "poor man's RTTI".
|
|
|
|
*/
|
|
|
|
static const char fgClassID;
|
|
|
|
|
2002-06-07 20:24:40 +00:00
|
|
|
public:
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Destructor.
|
|
|
|
*/
|
|
|
|
virtual ~AnyTransliterator();
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Copy constructor.
|
|
|
|
*/
|
|
|
|
AnyTransliterator(const AnyTransliterator&);
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Transliterator API.
|
|
|
|
*/
|
|
|
|
Transliterator* clone() const;
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Implements {@link Transliterator#handleTransliterate}.
|
|
|
|
*/
|
|
|
|
virtual void handleTransliterate(Replaceable& text, UTransPosition& index,
|
|
|
|
UBool incremental) const;
|
|
|
|
|
2002-06-29 00:04:16 +00:00
|
|
|
/**
|
|
|
|
* ICU "poor man's RTTI", returns a UClassID for the actual class.
|
|
|
|
*
|
|
|
|
* @draft ICU 2.2
|
|
|
|
*/
|
|
|
|
virtual inline UClassID getDynamicClassID() const { return getStaticClassID(); }
|
|
|
|
|
|
|
|
/**
|
|
|
|
* ICU "poor man's RTTI", returns a UClassID for this class.
|
|
|
|
*
|
|
|
|
* @draft ICU 2.2
|
|
|
|
*/
|
|
|
|
static inline UClassID getStaticClassID() { return (UClassID)&fgClassID; }
|
|
|
|
|
2002-06-07 20:24:40 +00:00
|
|
|
private:
|
|
|
|
|
|
|
|
/**
|
2002-06-11 22:36:11 +00:00
|
|
|
* Private constructor
|
|
|
|
* @param id the ID of the form S-T or S-T/V, where T is theTarget
|
|
|
|
* and V is theVariant. Must not be empty.
|
|
|
|
* @param theTarget the target name. Must not be empty, and must
|
|
|
|
* name a script corresponding to theTargetScript.
|
|
|
|
* @param theVariant the variant name, or the empty string if
|
|
|
|
* there is no variant
|
|
|
|
* @param theTargetScript the script code corresponding to
|
|
|
|
* theTarget.
|
|
|
|
* @param ec error code, fails if the internal hashtable cannot be
|
|
|
|
* allocated
|
2002-06-07 20:24:40 +00:00
|
|
|
*/
|
2002-06-11 22:36:11 +00:00
|
|
|
AnyTransliterator(const UnicodeString& id,
|
|
|
|
const UnicodeString& theTarget,
|
|
|
|
const UnicodeString& theVariant,
|
|
|
|
UScriptCode theTargetScript,
|
|
|
|
UErrorCode& ec);
|
2002-06-07 20:24:40 +00:00
|
|
|
|
|
|
|
/**
|
2002-06-11 22:36:11 +00:00
|
|
|
* Returns a transliterator from the given source to our target or
|
|
|
|
* target/variant. Returns NULL if the source is the same as our
|
|
|
|
* target script, or if the source is USCRIPT_INVALID_CODE.
|
|
|
|
* Caches the result and returns the same transliterator the next
|
|
|
|
* time. The caller does NOT own the result and must not delete
|
|
|
|
* it.
|
2002-06-07 20:24:40 +00:00
|
|
|
*/
|
2002-06-11 22:36:11 +00:00
|
|
|
Transliterator* getTransliterator(UScriptCode source) const;
|
|
|
|
|
2002-06-07 20:24:40 +00:00
|
|
|
/**
|
2002-06-11 22:36:11 +00:00
|
|
|
* Registers standard transliterators with the system. Called by
|
2002-06-07 20:24:40 +00:00
|
|
|
* Transliterator during initialization.
|
|
|
|
*/
|
|
|
|
static void registerIDs();
|
|
|
|
|
|
|
|
friend class Transliterator; // for registerIDs()
|
|
|
|
|
|
|
|
/**
|
2002-06-11 22:36:11 +00:00
|
|
|
* Return the script code for a given name, or
|
|
|
|
* USCRIPT_INVALID_CODE if not found.
|
2002-06-07 20:24:40 +00:00
|
|
|
*/
|
2002-06-11 22:36:11 +00:00
|
|
|
static UScriptCode scriptNameToCode(const UnicodeString& name);
|
2002-06-07 20:24:40 +00:00
|
|
|
};
|
|
|
|
|
|
|
|
U_NAMESPACE_END
|
|
|
|
|
2002-09-20 01:54:48 +00:00
|
|
|
#endif /* #if !UCONFIG_NO_TRANSLITERATION */
|
|
|
|
|
2002-06-07 20:24:40 +00:00
|
|
|
#endif
|