ICU-3800 update tags for 3.0

X-SVN-Rev: 15669
This commit is contained in:
Doug Felt 2004-06-02 03:04:17 +00:00
parent 32e82c28af
commit a62522c77e
2 changed files with 1122 additions and 1041 deletions

File diff suppressed because it is too large Load Diff

View File

@ -28,33 +28,37 @@ package com.ibm.icu.lang;
*/
public interface UProperty
{
// public data member --------------------------------------------------
// public data member --------------------------------------------------
/**
* <p>Binary property Alphabetic. </p>
* <p>Property for UCharacter.isUAlphabetic(), different from the property
* in UCharacter.isalpha().</p>
* <p>Lu + Ll + Lt + Lm + Lo + Nl + Other_Alphabetic.</p>
/**
* <p>Binary property Alphabetic. </p>
* <p>Property for UCharacter.isUAlphabetic(), different from the property
* in UCharacter.isalpha().</p>
* <p>Lu + Ll + Lt + Lm + Lo + Nl + Other_Alphabetic.</p>
* @stable ICU 2.6
*/
*/
public static final int ALPHABETIC = 0;
/**
* First constant for binary Unicode properties.
* @stable ICU 2.6
*/
public static final int BINARY_START = ALPHABETIC;
/**
* Binary property ASCII_Hex_Digit (0-9 A-F a-f).
* @stable ICU 2.6
*/
public static final int ASCII_HEX_DIGIT = 1;
/**
* <p>Binary property Bidi_Control.</p>
* <p>Format controls which have specific functions in the Bidi Algorithm.
* </p>
* @stable ICU 2.6
*/
public static final int BIDI_CONTROL = 2;
public static final int BIDI_CONTROL = 2;
/**
* <p>Binary property Bidi_Mirrored.</p>
* <p>Characters that may change display in RTL text.</p>
@ -63,12 +67,14 @@ public interface UProperty
* @stable ICU 2.6
*/
public static final int BIDI_MIRRORED = 3;
/**
* <p>Binary property Dash.</p>
* <p>Variations of dashes.</p>
* @stable ICU 2.6
*/
public static final int DASH = 4;
/**
* <p>Binary property Default_Ignorable_Code_Point (new).
* </p>
@ -79,12 +85,14 @@ public interface UProperty
* @stable ICU 2.6
*/
public static final int DEFAULT_IGNORABLE_CODE_POINT = 5;
/**
* <p>Binary property Deprecated (new).</p>
* <p>The usage of deprecated characters is strongly discouraged.</p>
* @stable ICU 2.6
*/
public static final int DEPRECATED = 6;
/**
* <p>Binary property Diacritic.</p>
* <p>Characters that linguistically modify the meaning of another
@ -92,6 +100,7 @@ public interface UProperty
* @stable ICU 2.6
*/
public static final int DIACRITIC = 7;
/**
* <p>Binary property Extender.</p>
* <p>Extend the value or shape of a preceding alphabetic character, e.g.
@ -99,6 +108,7 @@ public interface UProperty
* @stable ICU 2.6
*/
public static final int EXTENDER = 8;
/**
* <p>Binary property Full_Composition_Exclusion.</p>
* <p>CompositionExclusions.txt + Singleton Decompositions +
@ -106,6 +116,7 @@ public interface UProperty
* @stable ICU 2.6
*/
public static final int FULL_COMPOSITION_EXCLUSION = 9;
/**
* <p>Binary property Grapheme_Base (new).</p>
* <p>For programmatic determination of grapheme cluster boundaries.
@ -113,6 +124,7 @@ public interface UProperty
* @stable ICU 2.6
*/
public static final int GRAPHEME_BASE = 10;
/**
* <p>Binary property Grapheme_Extend (new).</p>
* <p>For programmatic determination of grapheme cluster boundaries.</p>
@ -120,18 +132,21 @@ public interface UProperty
* @stable ICU 2.6
*/
public static final int GRAPHEME_EXTEND = 11;
/**
* <p>Binary property Grapheme_Link (new).</p>
* <p>For programmatic determination of grapheme cluster boundaries.</p>
* @stable ICU 2.6
*/
public static final int GRAPHEME_LINK = 12;
/**
* <p>Binary property Hex_Digit.</p>
* <p>Characters commonly used for hexadecimal numbers.</p>
* @stable ICU 2.6
*/
public static final int HEX_DIGIT = 13;
/**
* <p>Binary property Hyphen.</p>
* <p>Dashes used to mark connections between pieces of words, plus the
@ -139,6 +154,7 @@ public interface UProperty
* @stable ICU 2.6
*/
public static final int HYPHEN = 14;
/**
* <p>Binary property ID_Continue.</p>
* <p>Characters that can continue an identifier.</p>
@ -146,6 +162,7 @@ public interface UProperty
* @stable ICU 2.6
*/
public static final int ID_CONTINUE = 15;
/**
* <p>Binary property ID_Start.</p>
* <p>Characters that can start an identifier.</p>
@ -153,12 +170,14 @@ public interface UProperty
* @stable ICU 2.6
*/
public static final int ID_START = 16;
/**
* <p>Binary property Ideographic.</p>
* <p>CJKV ideographs.</p>
* @stable ICU 2.6
*/
public static final int IDEOGRAPHIC = 17;
/**
* <p>Binary property IDS_Binary_Operator (new).</p>
* <p>For programmatic determination of Ideographic Description Sequences.
@ -166,6 +185,7 @@ public interface UProperty
* @stable ICU 2.6
*/
public static final int IDS_BINARY_OPERATOR = 18;
/**
* <p>Binary property IDS_Trinary_Operator (new).</p>
* <p?For programmatic determination of Ideographic Description
@ -173,12 +193,14 @@ public interface UProperty
* @stable ICU 2.6
*/
public static final int IDS_TRINARY_OPERATOR = 19;
/**
* <p>Binary property Join_Control.</p>
* <p>Format controls for cursive joining and ligation.</p>
* @stable ICU 2.6
*/
public static final int JOIN_CONTROL = 20;
/**
* <p>Binary property Logical_Order_Exception (new).</p>
* <p>Characters that do not use logical order and require special
@ -186,6 +208,7 @@ public interface UProperty
* @stable ICU 2.6
*/
public static final int LOGICAL_ORDER_EXCEPTION = 21;
/**
* <p>Binary property Lowercase.</p>
* <p>Same as UCharacter.isULowercase(), different from
@ -194,11 +217,13 @@ public interface UProperty
* @stable ICU 2.6
*/
public static final int LOWERCASE = 22;
/** <p>Binary property Math.</p>
* <p>Sm+Other_Math</p>
* @stable ICU 2.6
*/
public static final int MATH = 23;
/**
* <p>Binary property Noncharacter_Code_Point.</p>
* <p>Code points that are explicitly defined as illegal for the encoding
@ -206,11 +231,13 @@ public interface UProperty
* @stable ICU 2.6
*/
public static final int NONCHARACTER_CODE_POINT = 24;
/**
* <p>Binary property Quotation_Mark.</p>
* @stable ICU 2.6
*/
public static final int QUOTATION_MARK = 25;
/**
* <p>Binary property Radical (new).</p>
* <p>For programmatic determination of Ideographic Description
@ -218,6 +245,7 @@ public interface UProperty
* @stable ICU 2.6
*/
public static final int RADICAL = 26;
/**
* <p>Binary property Soft_Dotted (new).</p>
* <p>Characters with a "soft dot", like i or j.</p>
@ -225,6 +253,7 @@ public interface UProperty
* @stable ICU 2.6
*/
public static final int SOFT_DOTTED = 27;
/**
* <p>Binary property Terminal_Punctuation.</p>
* <p>Punctuation characters that generally mark the end of textual
@ -232,6 +261,7 @@ public interface UProperty
* @stable ICU 2.6
*/
public static final int TERMINAL_PUNCTUATION = 28;
/**
* <p>Binary property Unified_Ideograph (new).</p>
* <p>For programmatic determination of Ideographic Description
@ -239,6 +269,7 @@ public interface UProperty
* @stable ICU 2.6
*/
public static final int UNIFIED_IDEOGRAPH = 29;
/**
* <p>Binary property Uppercase.</p>
* <p>Same as UCharacter.isUUppercase(), different from
@ -247,6 +278,7 @@ public interface UProperty
* @stable ICU 2.6
*/
public static final int UPPERCASE = 30;
/**
* <p>Binary property White_Space.</p>
* <p>Same as UCharacter.isUWhiteSpace(), different from
@ -255,6 +287,7 @@ public interface UProperty
* @stable ICU 2.6
*/
public static final int WHITE_SPACE = 31;
/**
* <p>Binary property XID_Continue.</p>
* <p>ID_Continue modified to allow closure under normalization forms
@ -262,6 +295,7 @@ public interface UProperty
* @stable ICU 2.6
*/
public static final int XID_CONTINUE = 32;
/**
* <p>Binary property XID_Start.</p>
* <p>ID_Start modified to allow closure under normalization forms NFKC
@ -269,6 +303,7 @@ public interface UProperty
* @stable ICU 2.6
*/
public static final int XID_START = 33;
/**
* <p>Binary property Case_Sensitive.</p>
* <p>Either the source of a case
@ -277,6 +312,7 @@ public interface UProperty
* @draft ICU 2.6
*/
public static final int CASE_SENSITIVE = 34;
/**
* Binary property STerm (new in Unicode 4.0.1).
* Sentence Terminal. Used in UAX #29: Text Boundaries
@ -284,6 +320,7 @@ public interface UProperty
* @draft ICU 3.0
*/
public static final int S_TERM = 35;
/**
* Binary property Variation_Selector (new in Unicode 4.0.1).
* Indicates all those characters that qualify as Variation Selectors.
@ -292,6 +329,7 @@ public interface UProperty
* @draft ICU 3.0
*/
public static final int VARIATION_SELECTOR = 36;
/** Binary property NFD_Inert.
ICU-specific property for characters that are inert under NFD,
i.e., they do not interact with adjacent characters.
@ -308,13 +346,14 @@ public interface UProperty
d) can never compose with a previous character.
e) can never compose with a following character.
f) can never change if another character is added.
Example: a-breve might satisfy all but f, but if you
add an ogonek it changes to a-ogonek + breve
Example: a-breve might satisfy all but f, but if you
add an ogonek it changes to a-ogonek + breve
See also com.ibm.text.UCD.NFSkippable in the ICU4J repository,
and icu/source/common/unormimp.h .
@draft ICU 3.0 */
public static final int NFD_INERT = 37;
/** Binary property NFKD_Inert.
ICU-specific property for characters that are inert under NFKD,
i.e., they do not interact with adjacent characters.
@ -324,6 +363,7 @@ public interface UProperty
@see #NFD_INERT
@draft ICU 3.0 */
public static final int NFKD_INERT = 38;
/** Binary property NFC_Inert.
ICU-specific property for characters that are inert under NFC,
i.e., they do not interact with adjacent characters.
@ -333,6 +373,7 @@ public interface UProperty
@see #NFD_INERT
@draft ICU 3.0 */
public static final int NFC_INERT = 39;
/** Binary property NFKC_Inert.
ICU-specific property for characters that are inert under NFKC,
i.e., they do not interact with adjacent characters.
@ -342,6 +383,7 @@ public interface UProperty
@see #NFD_INERT
@draft ICU 3.0 */
public static final int NFKC_INERT = 40;
/** Binary Property Segment_Starter.
ICU-specific property for characters that are starters in terms of
Unicode normalization and combining character sequences.
@ -353,6 +395,7 @@ public interface UProperty
processing collation tailoring rules.
@draft ICU 3.0 */
public static final int SEGMENT_STARTER = 41;
/**
* <p>One more than the last constant for binary Unicode properties.</p>
* @stable ICU 2.6
@ -362,74 +405,85 @@ public interface UProperty
/**
* Enumerated property Bidi_Class.
* Same as UCharacter.getDirection(int), returns UCharacterDirection values.
* @draft ICU 2.4
* @stable ICU 2.4
*/
public static final int BIDI_CLASS = 0x1000;
/**
* First constant for enumerated/integer Unicode properties.
* @draft ICU 2.4
* @stable ICU 2.4
*/
public static final int INT_START = BIDI_CLASS;
/**
* Enumerated property Block.
* Same as UCharacter.UnicodeBlock.of(int), returns UCharacter.UnicodeBlock
* values.
* @draft ICU 2.4
* @stable ICU 2.4
*/
public static final int BLOCK = 0x1001;
/**
* Enumerated property Canonical_Combining_Class.
* Same as UCharacter.getCombiningClass(int), returns 8-bit numeric values.
* @draft ICU 2.4
* @stable ICU 2.4
*/
public static final int CANONICAL_COMBINING_CLASS = 0x1002;
/**
* Enumerated property Decomposition_Type.
* Returns UCharacter.DecompositionType values.
* @draft ICU 2.4
* @stable ICU 2.4
*/
public static final int DECOMPOSITION_TYPE = 0x1003;
/**
* Enumerated property East_Asian_Width.
* See http://www.unicode.org/reports/tr11/
* Returns UCharacter.EastAsianWidth values.
* @draft ICU 2.4
* @stable ICU 2.4
*/
public static final int EAST_ASIAN_WIDTH = 0x1004;
/**
* Enumerated property General_Category.
* Same as UCharacter.getType(int), returns UCharacterCategory values.
* @draft ICU 2.4
* @stable ICU 2.4
*/
public static final int GENERAL_CATEGORY = 0x1005;
/**
* Enumerated property Joining_Group.
* Returns UCharacter.JoiningGroup values.
* @draft ICU 2.4
* @stable ICU 2.4
*/
public static final int JOINING_GROUP = 0x1006;
/**
* Enumerated property Joining_Type.
* Returns UCharacter.JoiningType values.
* @draft ICU 2.4
* @stable ICU 2.4
*/
public static final int JOINING_TYPE = 0x1007;
/**
* Enumerated property Line_Break.
* Returns UCharacter.LineBreak values.
* @draft ICU 2.4
* @stable ICU 2.4
*/
public static final int LINE_BREAK = 0x1008;
/**
* Enumerated property Numeric_Type.
* Returns UCharacter.NumericType values.
* @draft ICU 2.4
* @stable ICU 2.4
*/
public static final int NUMERIC_TYPE = 0x1009;
/**
* Enumerated property Script.
* Same as UScript.getScript(int), returns UScript values.
* @draft ICU 2.4
* @stable ICU 2.4
*/
public static final int SCRIPT = 0x100A;
@ -439,30 +493,35 @@ public interface UProperty
* @draft ICU 2.6
* */
public static final int HANGUL_SYLLABLE_TYPE = 0x100B;
/**
* Enumerated property NFD_Quick_Check.
* Returns numeric values compatible with Normalizer.QuickCheckResult.
* @draft ICU 3.0
*/
public static final int NFD_QUICK_CHECK = 0x100C;
/**
* Enumerated property NFKD_Quick_Check.
* Returns numeric values compatible with Normalizer.QuickCheckResult.
* @draft ICU 3.0
*/
public static final int NFKD_QUICK_CHECK = 0x100D;
/**
* Enumerated property NFC_Quick_Check.
* Returns numeric values compatible with Normalizer.QuickCheckResult.
* @draft ICU 3.0
*/
public static final int NFC_QUICK_CHECK = 0x100E;
/**
* Enumerated property NFKC_Quick_Check.
* Returns numeric values compatible with Normalizer.QuickCheckResult.
* @draft ICU 3.0
*/
public static final int NFKC_QUICK_CHECK = 0x100F;
/**
* Enumerated property Lead_Canonical_Combining_Class.
* ICU-specific property for the ccc of the first code point
@ -473,6 +532,7 @@ public interface UProperty
* @draft ICU 3.0
*/
public static final int LEAD_CANONICAL_COMBINING_CLASS = 0x1010;
/**
* Enumerated property Trail_Canonical_Combining_Class.
* ICU-specific property for the ccc of the last code point
@ -483,10 +543,11 @@ public interface UProperty
* @draft ICU 3.0
*/
public static final int TRAIL_CANONICAL_COMBINING_CLASS = 0x1011;
/**
* One more than the last constant for enumerated/integer Unicode
* properties.
* @draft ICU 2.4
* @stable ICU 2.4
*/
public static final int INT_LIMIT = 0x1012;
@ -497,122 +558,141 @@ public interface UProperty
* returns bit masks for UCharacterCategory values where exactly one bit is set.
* When used with UCharacter.getPropertyValueName() and UCharacter.getPropertyValueEnum(),
* a multi-bit mask is used for sets of categories like "Letters".
* @draft ICU 2.4
* @stable ICU 2.4
*/
public static final int GENERAL_CATEGORY_MASK = 0x2000;
/**
* First constant for bit-mask Unicode properties.
* @draft ICU 2.4
* @stable ICU 2.4
*/
public static final int MASK_START = GENERAL_CATEGORY_MASK;
/**
* One more than the last constant for bit-mask Unicode properties.
* @draft ICU 2.4
* @stable ICU 2.4
*/
public static final int MASK_LIMIT = 0x2001;
/**
* First constant for double Unicode properties.
* @draft ICU 2.4
*/
public static final int DOUBLE_START = 0x3000;
/**
* Double property Numeric_Value.
* Corresponds to UCharacter.getUnicodeNumericValue(int).
* @draft ICU 2.4
* @stable ICU 2.4
*/
public static final int NUMERIC_VALUE = DOUBLE_START;
public static final int NUMERIC_VALUE = 0x3000;
/**
* First constant for double Unicode properties.
* @stable ICU 2.4
*/
public static final int DOUBLE_START = NUMERIC_VALUE;
/**
* One more than the last constant for double Unicode properties.
* @draft ICU 2.4
* @stable ICU 2.4
*/
public static final int DOUBLE_LIMIT = 0x3001;
/**
* First constant for string Unicode properties.
* @draft ICU 2.4
*/
public static final int STRING_START = 0x4000;
/**
* String property Age.
* Corresponds to UCharacter.getAge(int).
* @draft ICU 2.4
* @stable ICU 2.4
*/
public static final int AGE = STRING_START;
public static final int AGE = 0x4000;
/**
* First constant for string Unicode properties.
* @stable ICU 2.4
*/
public static final int STRING_START = AGE;
/**
* String property Bidi_Mirroring_Glyph.
* Corresponds to UCharacter.getMirror(int).
* @draft ICU 2.4
* @stable ICU 2.4
*/
public static final int BIDI_MIRRORING_GLYPH = 0x4001;
/**
* String property Case_Folding.
* Corresponds to UCharacter.foldCase(String, boolean).
* @draft ICU 2.4
* @stable ICU 2.4
*/
public static final int CASE_FOLDING = 0x4002;
/**
* String property ISO_Comment.
* Corresponds to UCharacter.getISOComment(int).
* @draft ICU 2.4
* @stable ICU 2.4
*/
public static final int ISO_COMMENT = 0x4003;
/**
* String property Lowercase_Mapping.
* Corresponds to UCharacter.toLowerCase(String).
* @draft ICU 2.4
* @stable ICU 2.4
*/
public static final int LOWERCASE_MAPPING = 0x4004;
/**
* String property Name.
* Corresponds to UCharacter.getName(int).
* @draft ICU 2.4
* @stable ICU 2.4
*/
public static final int NAME = 0x4005;
/**
* String property Simple_Case_Folding.
* Corresponds to UCharacter.foldCase(int, boolean).
* @draft ICU 2.4
* @stable ICU 2.4
*/
public static final int SIMPLE_CASE_FOLDING = 0x4006;
/**
* String property Simple_Lowercase_Mapping.
* Corresponds to UCharacter.toLowerCase(int).
* @draft ICU 2.4
* @stable ICU 2.4
*/
public static final int SIMPLE_LOWERCASE_MAPPING = 0x4007;
/**
* String property Simple_Titlecase_Mapping.
* Corresponds to UCharacter.toTitleCase(int).
* @draft ICU 2.4
* @stable ICU 2.4
*/
public static final int SIMPLE_TITLECASE_MAPPING = 0x4008;
/**
* String property Simple_Uppercase_Mapping.
* Corresponds to UCharacter.toUpperCase(int).
* @draft ICU 2.4
* @stable ICU 2.4
*/
public static final int SIMPLE_UPPERCASE_MAPPING = 0x4009;
/**
* String property Titlecase_Mapping.
* Corresponds to UCharacter.toTitleCase(String).
* @draft ICU 2.4
* @stable ICU 2.4
*/
public static final int TITLECASE_MAPPING = 0x400A;
/**
* String property Unicode_1_Name.
* Corresponds to UCharacter.getName1_0(int).
* @draft ICU 2.4
* @stable ICU 2.4
*/
public static final int UNICODE_1_NAME = 0x400B;
/**
* String property Uppercase_Mapping.
* Corresponds to UCharacter.toUpperCase(String).
* @draft ICU 2.4
* @stable ICU 2.4
*/
public static final int UPPERCASE_MAPPING = 0x400C;
/**
* One more than the last constant for string Unicode properties.
* @draft ICU 2.4
* @stable ICU 2.4
*/
public static final int STRING_LIMIT = 0x400D;
@ -627,28 +707,28 @@ public interface UProperty
*
* @see UCharacter#getPropertyName
* @see UCharacter#getPropertyValueName
* @draft ICU 2.4
* @stable ICU 2.4
*/
public interface NameChoice {
/**
* Selector for the abbreviated name of a property or value.
* Most properties and values have a short name; those that do
* not return null.
* @draft ICU 2.4
* @stable ICU 2.4
*/
static final int SHORT = 0;
/**
* Selector for the long name of a property or value. All
* properties and values have a long name.
* @draft ICU 2.4
* @stable ICU 2.4
*/
static final int LONG = 1;
/**
* The number of predefined property name choices. Individual
* properties or values may have more than COUNT aliases.
* @draft ICU 2.4
* @stable ICU 2.4
*/
static final int COUNT = 2;
}