Obsolete; use UnicodeSet

X-SVN-Rev: 1472
2000-05-24 21:12:59 +00:00 · 2000-05-24 21:12:59 +00:00 · 95a8ec6569
commit 95a8ec6569
parent 769118da39
1 changed files with 0 additions and 975 deletions
--- a/icu4j/src/com/ibm/text/CharSet.java
+++ b/icu4j/src/com/ibm/text/CharSet.java
@ -1,975 +0,0 @@
-/*
- *******************************************************************************
- * Copyright (C) 1996-2000, International Business Machines Corporation and    *
- * others. All Rights Reserved.                                                *
- *******************************************************************************
- *
- * $Source: /xsrl/Nsvn/icu/icu4j/src/com/ibm/text/Attic/CharSet.java,v $ 
- * $Date: 2000/03/10 04:07:18 $ 
- * $Revision: 1.2 $
- *
- *****************************************************************************************
- */
-package com.ibm.text;
-
-import java.util.Hashtable;
-
-/**
- * An object representing a set of characters.  (This is a "set" in the
- * mathematical sense: an unduplicated list of characters on which set
- * operations such as union and intersection can be performed.)  The
- * set information is stored in compressed, optimized form: The object
- * contains a String with an even number of characters.  Each pair of
- * characters represents a range of characters contained in the set
- * (a pair of the same character represents a single character).  The
- * characters are sorted in increasing order.
- */
-public class CharSet implements Cloneable {
-    /**
-     * The structure containing the set information.  The characters
-     * in this string are organized into pairs, each pair representing
-     * a range of characters contained in the set
-     */
-    private String chars;
-
-    //==========================================================================
-    // parseString() and associated routines
-    //==========================================================================
-    /**
-     * A cache which is used to speed up parseString() whenever it is
-     * used to parse a description that has been parsed before
-     */
-    private static Hashtable expressionCache = null;
-
-    /**
-     * Builds a CharSet based on a textual description.  For the syntax of
-     * the description, see the documentation of RuleBasedBreakIterator.
-     * @see com.ibm.text.RuleBasedBreakIterator
-     */
-    public static CharSet parseString(String s) {
-        CharSet result = null;
-
-        // if "s" is in the expression cache, pull the result out
-        // of the expresison cache
-        if (expressionCache != null) {
-            result = (CharSet)expressionCache.get(s);
-        }
-
-        // otherwise, use doParseString() to actually parse the string,
-        // and then add a corresponding entry to the expression cache
-        if (result == null) {
-            result = doParseString(s);
-            if (expressionCache == null) {
-                expressionCache = new Hashtable();
-            }
-            expressionCache.put(s, result);
-        }
-        result = (CharSet)(result.clone());
-        return result;
-    }
-
-    /**
-     * This function is used by parseString() to actually parse the string
-     */
-    private static CharSet doParseString(String s) {
-        CharSet result = new CharSet();
-        int p = 0;
-
-        boolean haveDash = false;
-        boolean haveTilde = false;
-        boolean wIsReal = false;
-        char w = '\u0000';
-
-        // for each character in the description...
-        while (p < s.length()) {
-            char c = s.charAt(p);
-
-            // if it's an opening bracket...
-            if (c == '[') {
-                // flush the single-character cache
-                if (wIsReal) {
-                    result.internalUnion(new CharSet(w));
-                }
-
-                // locate the matching closing bracket
-                int bracketLevel = 1;
-                int q = p + 1;
-                while (bracketLevel != 0) {
-                    if (s.charAt(q) == '[') {
-                        ++bracketLevel;
-                    }
-                    else if (s.charAt(q) == ']') {
-                        --bracketLevel;
-                    }
-                    ++q;
-                }
-                --q;
-
-                // call parseString() recursively to parse the text inside
-                // the brackets, then either add or subtract the result from
-                // our running result depending on whether or not the []
-                // expresison was preceded by a ^
-                if (!haveTilde) {
-                    result.internalUnion(CharSet.parseString(s.substring(p + 1, q)));
-                }
-                else {
-                    result.internalDifference(CharSet.parseString(s.substring(p + 1, q)));
-                }
-                haveTilde = false;
-                haveDash = false;
-                wIsReal = false;
-                p = q + 1;
-            }
-
-            // if the character is a colon...
-            else if (c == ':') {
-                // flush the single-character cache
-                if (wIsReal) {
-                    result.internalUnion(new CharSet(w));
-                }
-
-                // locate the matching colon (and throw an error if there
-                // isn't one)
-                int q = s.indexOf(':', p + 1);
-                if (q == -1) {
-                    throw new IllegalArgumentException("Parse error at position " + p + " in " + s);
-                }
-
-                // use charSetForCategory() to parse the text in the colons,
-                // and either add or substract the result from our running
-                // result depending on whether the :: expression was
-                // preceded by a ^
-                if (!haveTilde) {
-                    result.internalUnion(charSetForCategory(s.substring(p + 1, q)));
-                }
-                else {
-                    result.internalDifference(charSetForCategory(s.substring(p + 1, q)));
-                }
-
-                // reset everything and advance to the next character
-                haveTilde = false;
-                haveDash = false;
-                wIsReal = false;
-                p = q + 1;
-            }
-
-            // if the character is a dash, set an appropriate flag
-            else if (c == '-') {
-                if (wIsReal) {
-                    haveDash = true;
-                }
-                ++p;
-            }
-
-            // if the character is a caret, flush the single-character
-            // cache and set an appropriate flag.  If the set is empty
-            // (i.e., if the expression begins with ^), invert the set
-            // (i.e., set it to include everything).  The idea here is
-            // that a set that includes nothing but ^ expressions
-            // means "everything but these things".
-            else if (c == '^') {
-                if (wIsReal) {
-                    result.internalUnion(new CharSet(w));
-                    wIsReal = false;
-                }
-                haveTilde = true;
-                ++p;
-                if (result.empty()) {
-                    result.internalComplement();
-                }
-            }
-
-            // throw an exception on an illegal character
-            else if (c >= ' ' && c < '\u007f' && !Character.isLetter(c)
-                     && !Character.isDigit(c) && c != '\\') {
-                throw new IllegalArgumentException("Parse error at position " + p + " in " + s);
-            }
-
-            // otherwise, we end up here...
-            else {
-                // on a backslash, advance to the next character
-                if (c == '\\') {
-                    ++p;
-                }
-
-                // if the preceding character was a dash, this character
-                // defines the end of a range.  Add or subtract that range
-                // from the running result depending on whether or not it
-                // was preceded by a ^
-                if (haveDash) {
-                    if (s.charAt(p) < w) {
-                        throw new IllegalArgumentException("U+" + Integer.toHexString(s.charAt(p))
-                            + " is less than U+" + Integer.toHexString(w) + ".  Dash expressions "
-                            + "can't have their endpoints in reverse order.");
-                    }
-
-                    if (!haveTilde) {
-                        result.internalUnion(new CharSet(w, s.charAt(p++)));
-                    }
-                    else {
-                        result.internalDifference(new CharSet(w, s.charAt(p++)));
-                    }
-                    haveDash = false;
-                    haveTilde = false;
-                    wIsReal = false;
-                }
-
-                // if the preceding character was a caret, remove this character
-                // from the running result
-                else if (haveTilde) {
-                    result.internalDifference(new CharSet(s.charAt(p++)));
-                    haveTilde = false;
-                    wIsReal = false;
-                }
-
-                // otherwise, flush the single-character cache and then
-                // put this character into the cache
-                else if (wIsReal) {
-                    result.internalUnion(new CharSet(w));
-                    w = s.charAt(p++);
-                    wIsReal = true;
-                }
-                else {
-                    w = s.charAt(p++);
-                    wIsReal = true;
-                }
-            }
-        }
-
-        // finally, flush the single-character cache one last time
-        if (wIsReal) {
-            result.internalUnion(new CharSet(w));
-        }
-
-        return result;
-    }
-
-    /**
-     * Creates a CharSet containing all the characters in a particular
-     * Unicode category.  The text is either a two-character code from
-     * the Unicode database or a single character that begins one or more
-     * two-character codes.
-     */
-    private static CharSet charSetForCategory(String category) {
-        // throw an exception if we have anything other than one or two
-        // characters inside the colons
-        if (category.length() == 0 || category.length() >= 3) {
-            throw new IllegalArgumentException("Invalid character category: " + category);
-        }
-
-        // if we have two characters, search the category map for that code
-        // and either construct and return a CharSet from the data in the
-        // category map or throw an exception
-        if (category.length() == 2) {
-            for (int i = 0; i < categoryMap.length; i++) {
-                if (categoryMap[i][0].equals(category)) {
-                    return new CharSet(categoryMap[i][1]);
-                }
-            }
-            throw new IllegalArgumentException("Invalid character category: " + category);
-        }
-
-        // if we have one character, search the category map for codes beginning
-        // with that letter, and union together all of the matching sets that
-        // we find (or throw an exception if there are no matches)
-        else if (category.length() == 1) {
-            CharSet result = new CharSet();
-            for (int i = 0; i < categoryMap.length; i++) {
-                if (categoryMap[i][0].startsWith(category)) {
-                    result = result.union(new CharSet(categoryMap[i][1]));
-                }
-            }
-            if (result.empty()) {
-                throw new IllegalArgumentException("Invalid character category: " + category);
-            }
-            else {
-                return result;
-            }
-        }
-        return new CharSet(); // should never get here, but to make the compiler happy...
-    }
-
-    /**
-     * Returns a copy of CharSet's expression cache and sets CharSet's
-     * expression cache to empty.
-     */
-    public static Hashtable releaseExpressionCache() {
-        Hashtable result = expressionCache;
-        expressionCache = null;
-        return result;
-    }
-
-    //==========================================================================
-    // CharSet manipulation
-    //==========================================================================
-    /**
-     * Creates an empty CharSet.
-     */
-    public CharSet() {
-        chars = "";
-    }
-
-    /**
-     * Creates a CharSet containing a single character.
-     * @param c The character to put into the CharSet
-     */
-    public CharSet(char c) {
-        StringBuffer temp = new StringBuffer();
-        temp.append(c);
-        temp.append(c);
-        chars = temp.toString();
-    }
-
-    /**
-     * Creates a CharSet containing a range of characters.
-     * @param lo The lowest-numbered character to include in the range
-     * @param hi The highest-numbered character to include in the range
-     */
-    public CharSet(char lo, char hi) {
-        StringBuffer temp = new StringBuffer();
-        if (lo <= hi) {
-            temp.append(lo);
-            temp.append(hi);
-        }
-        else {
-            temp.append(hi);
-            temp.append(lo);
-        }
-        chars = temp.toString();
-    }
-
-    /**
-     * Creates a CharSet, initializing it from the internal storage
-     * of another CharSet (this function performs no error checking
-     * on "chars", so if it's malformed, undefined behavior will result)
-     */
-    private CharSet(String chars) {
-        this.chars = chars;
-    }
-
-    /**
-     * Returns a CharSet representing the union of two CharSets.
-     */
-    public CharSet union(CharSet that) {
-        return new CharSet(doUnion(that.chars).toString());
-    }
-
-    /**
-     * Adds the characters in "that" to this CharSet
-     */
-    private void internalUnion(CharSet that) {
-        chars = doUnion(that.chars).toString();
-    }
-
-    /**
-     * The actual implementation of the union functions
-     */
-    private StringBuffer doUnion(String c2) {
-        StringBuffer result = new StringBuffer();
-
-        int i = 0;
-        int j = 0;
-
-        // consider all the characters in both strings
-        while (i < chars.length() && j < c2.length()) {
-            char ub;
-
-            // the first character in the result is the lower of the
-            // starting characters of the two strings, and "ub" gets
-            // set to the upper bound of that range
-            if (chars.charAt(i) < c2.charAt(j)) {
-                result.append(chars.charAt(i));
-                ub = chars.charAt(++i);
-            }
-            else {
-                result.append(c2.charAt(j));
-                ub = c2.charAt(++j);
-            }
-
-            // for as long as one of our two pointers is pointing to a range's
-            // end point, or i is pointing to a character that is less than
-            // "ub" plus one (the "plus one" stitches touching ranges together)...
-            while (i % 2 == 1 ||
-                   j % 2 == 1 ||
-                   (i < chars.length() && chars.charAt(i) <= ub + 1)) {
-
-                // advance i to the first character that is greater than
-                // "ub" plus one
-                while (i < chars.length() && chars.charAt(i) <= ub + 1) {
-                    ++i;
-                }
-
-                // if i points to the endpoint of a range, update "ub"
-                // to that character, or if i points to the start of
-                // a range and the endpoint of the preceding range is
-                // greater than "ub", update "up" to _that_ character
-                if (i % 2 == 1) {
-                    ub = chars.charAt(i);
-                }
-                else if (i > 0 && chars.charAt(i - 1) > ub) {
-                    ub = chars.charAt(i - 1);
-                }
-
-                // now advance j to the first character that is greater
-                // that "ub" plus one
-                while (j < c2.length() && c2.charAt(j) <= ub + 1) {
-                    ++j;
-                }
-
-                // if j points to the endpoint of a range, update "ub"
-                // to that character, or if j points to the start of
-                // a range and the endpoint of the preceding range is
-                // greater than "ub", update "up" to _that_ character
-                if (j % 2 == 1) {
-                    ub = c2.charAt(j);
-                }
-                else if (j > 0 && c2.charAt(j - 1) > ub) {
-                    ub = c2.charAt(j - 1);
-                }
-            }
-            // when we finally fall out of this loop, we will have stitched
-            // together a series of ranges that overlap or touch, i and j
-            // will both point to starting points of ranges, and "ub" will
-            // be the endpoint of the range we're working on.  Write "ub"
-            // to the result
-            result.append(ub);
-
-        // loop back around to create the next range in the result
-        }
-
-        // we fall out to here when we've exhausted all the characters in
-        // one of the operands.  We can append all of the remaining characters
-        // in the other operand without doing any extra work.
-        if (i < chars.length()) {
-            result.append(chars.substring(i));
-        }
-        if (j < c2.length()) {
-            result.append(c2.substring(j));
-        }
-
-        return result;
-    }
-
-    /**
-     * Returns the intersection of two CharSets.
-     */
-    public CharSet intersection(CharSet that) {
-        return new CharSet(doIntersection(that.chars).toString());
-    }
-
-    /**
-     * Removes from this CharSet any characters that aren't also in "that"
-     */
-    private void internalIntersection(CharSet that) {
-        chars = doIntersection(that.chars).toString();
-    }
-
-    /**
-     * The internal implementation of the two intersection functions
-     */
-    private StringBuffer doIntersection(String c2) {
-        StringBuffer result = new StringBuffer();
-
-        int i = 0;
-        int j = 0;
-        int oldI;
-        int oldJ;
-
-        // iterate until we've exhausted one of the operands
-        while (i < chars.length() && j < c2.length()) {
-
-            // advance j until it points to a character that is larger than
-            // the one i points to.  If this is the beginning of a one-
-            // character range, advance j to point to the end
-            if (i < chars.length() && i % 2 == 0) {
-                while (j < c2.length() && c2.charAt(j) < chars.charAt(i)) {
-                    ++j;
-                }
-                if (j < c2.length() && j % 2 == 0 && c2.charAt(j) == chars.charAt(i)) {
-                    ++j;
-                }
-            }
-
-            // if j points to the endpoint of a range, save the current
-            // value of i, then advance i until it reaches a character
-            // which is larger than the character pointed at
-            // by j.  All of the characters we've advanced over (except
-            // the one currently pointed to by i) are added to the result
-            oldI = i;
-            while (j % 2 == 1 && i < chars.length() && chars.charAt(i) <= c2.charAt(j)) {
-                ++i;
-            }
-            result.append(chars.substring(oldI, i));
-
-            // if i points to the endpoint of a range, save the current
-            // value of j, then advance j until it reaches a character
-            // which is larger than the character pointed at
-            // by i.  All of the characters we've advanced over (except
-            // the one currently pointed to by i) are added to the result
-            oldJ = j;
-            while (i % 2 == 1 && j < c2.length() && c2.charAt(j) <= chars.charAt(i)) {
-                ++j;
-            }
-            result.append(c2.substring(oldJ, j));
-
-            // advance i until it points to a character larger than j
-            // If it points at the beginning of a one-character range,
-            // advance it to the end of that range
-            if (j < c2.length() && j % 2 == 0) {
-                while (i < chars.length() && chars.charAt(i) < c2.charAt(j)) {
-                    ++i;
-                }
-                if (i < chars.length() && i % 2 == 0 && c2.charAt(j) == chars.charAt(i)) {
-                    ++i;
-                }
-            }
-        }
-
-        return result;
-    }
-
-    /**
-     * Returns a CharSet containing all the characters in "this" that
-     * aren't also in "that"
-     */
-    public CharSet difference(CharSet that) {
-        return new CharSet(doIntersection(that.doComplement().toString()).toString());
-    }
-
-    /**
-     * Removes from "this" all the characters that are also in "that"
-     */
-    private void internalDifference(CharSet that) {
-        chars = doIntersection(that.doComplement().toString()).toString();
-    }
-
-    /**
-     * Returns a CharSet containing all the characters which are not
-     * in "this"
-     */
-    public CharSet complement() {
-        return new CharSet(doComplement().toString());
-    }
-
-    /**
-     * Complements "this".  All the characters it contains are removed,
-     * and all the characters it doesn't contain are added.
-     */
-    private void internalComplement() {
-        chars = doComplement().toString();
-    }
-
-    /**
-     * The internal implementation function for the complement routines
-     */
-    private StringBuffer doComplement() {
-        // the complement of an empty CharSet is one containing everything
-        if (empty()) {
-            return new StringBuffer("\u0000\uffff");
-        }
-
-        StringBuffer result = new StringBuffer();
-
-        int i = 0;
-
-        // the result begins with \u0000 unless the original CharSet does
-        if (chars.charAt(0) != '\u0000') {
-            result.append('\u0000');
-        }
-
-        // walk through the characters in this CharSet.  Append a pair of
-        // characters the first of which is one less than the first
-        // character we see and the second of which is one plus the second
-        // character we see (don't write the first character if it's \u0000,
-        // and don't write the second character if it's \uffff.
-        while (i < chars.length()) {
-            if (chars.charAt(i) != '\u0000') {
-                result.append((char)(chars.charAt(i) - 1));
-            }
-            if (chars.charAt(i + 1) != '\uffff') {
-                result.append((char)(chars.charAt(i + 1) + 1));
-            }
-            i += 2;
-        }
-
-        // add \uffff to the end of the result, unless it was in
-        // the original set
-        if (chars.charAt(chars.length() - 1) != '\uffff') {
-            result.append('\uffff');
-        }
-
-        return result;
-    }
-
-    /**
-     * Returns true if this CharSet contains the specified character
-     * @param c The character we're testing for set membership
-     */
-    public boolean contains(char c) {
-        // search for the first range endpoint that is greater than or
-        // equal to c
-        int i = 1;
-        while (i < chars.length() && chars.charAt(i) < c) {
-            i += 2;
-        }
-
-        // if we've walked off the end, we don't contain c
-        if (i == chars.length()) {
-            return false;
-        }
-
-        // otherwise, we contain c if the beginning of the range is less
-        // than or equal to c
-        return chars.charAt(i - 1) <= c;
-    }
-
-    /**
-     * Returns true if "that" is another instance of CharSet containing
-     * the exact same characters as this one
-     */
-    public boolean equals(Object that) {
-        return (that instanceof CharSet) && chars.equals(((CharSet)that).chars);
-    }
-
-    /**
-     * Creates a new CharSet that is equal to this one
-     */
-    public Object clone() {
-        return new CharSet(chars);
-    }
-
-    /**
-     * Returns true if this CharSet contains no characters
-     */
-    public boolean empty() {
-        return chars.length() == 0;
-    }
-
-    /**
-     * Returns a textual representation of this CharSet.  If the result
-     * of calling this function is passed to CharSet.parseString(), it
-     * will produce another CharSet that is equal to this one.
-     */
-    public String toString() {
-        StringBuffer result = new StringBuffer();
-
-        // the result begins with an opening bracket
-        result.append('[');
-
-        // iterate through the ranges in the CharSet
-        for (int i = 0; i < chars.length(); i += 2) {
-            // for a range with the same beginning and ending point,
-            // output that character
-            if (chars.charAt(i) == chars.charAt(i + 1)) {
-                result.append(chars.charAt(i));
-            }
-
-            // otherwise, output the start and end points of the range
-            // separated by a dash
-            else {
-                result.append(chars.charAt(i) + "-" + chars.charAt(i + 1));
-            }
-        }
-
-        // the result ends with a closing bracket
-        result.append(']');
-        return result.toString();
-    }
-
-    /**
-     * Returns a String representing the contents of this CharSet
-     * in the same form in which they're stored internally: as pairs
-     * of characters representing the start and end points of ranges
-     */
-    public String getRanges() {
-        return chars;
-    }
-
-    /**
-     * Returns an Enumeration that will return the ranges of characters
-     * contained in this CharSet one at a time
-     */
-    public Enumeration getChars() {
-        return new Enumeration(this);
-    }
-
-    //==========================================================================
-    // CharSet.Enumeration
-    //==========================================================================
-
-    /**
-     * An Enumeration that can be used to extract the character ranges
-     * from a CharSet one at a time
-     */
-    public class Enumeration implements java.util.Enumeration {
-        /**
-         * Initializes a CharSet.Enumeration
-         */
-        Enumeration(CharSet cs) {
-            this.chars = cs.chars;
-            p = 0;
-        }
-
-        /**
-         * Returns true if the enumeration hasn't yet returned
-         * all the ranges in the CharSet
-         */
-        public boolean hasMoreElements() {
-            return p < chars.length();
-        }
-
-        /**
-         * Returns the next range in the CarSet
-         */
-        public Object nextElement() {
-            char[] result = new char[2];
-            result[0] = chars.charAt(p);
-            result[1] = chars.charAt(p + 1);
-            p += 2;
-
-            return result;
-        }
-
-        int p;
-        String chars;
-    }
-
-    //==========================================================================
-    // tables for charSetForCategory()
-    //==========================================================================
-
-    /**
-     * Table used with charSetFromCategory.  This is an array of pairs
-     * of Strings.  The first column of Strings is Unicode character category
-     * codes as defined in the Unicode database.  The second column is the
-     * internal storage for a CharSet containing the characters in that
-     * category.
-     */
-    private static final String[][] categoryMap = {
-        { "Ll", "az\u00AA\u00AA\u00B5\u00B5\u00BA\u00BA\u00DF\u00F6\u00F8\u00FF\u0101\u0101"
-          + "\u0103\u0103\u0105\u0105\u0107\u0107\u0109\u0109\u010B\u010B\u010D\u010D"
-          + "\u010F\u010F\u0111\u0111\u0113\u0113\u0115\u0115\u0117\u0117\u0119\u0119"
-          + "\u011B\u011B\u011D\u011D\u011F\u011F\u0121\u0121\u0123\u0123\u0125\u0125"
-          + "\u0127\u0127\u0129\u0129\u012B\u012B\u012D\u012D\u012F\u012F\u0131\u0131"
-          + "\u0133\u0133\u0135\u0135\u0137\u0138\u013A\u013A\u013C\u013C\u013E\u013E"
-          + "\u0140\u0140\u0142\u0142\u0144\u0144\u0146\u0146\u0148\u0149\u014B\u014B"
-          + "\u014D\u014D\u014F\u014F\u0151\u0151\u0153\u0153\u0155\u0155\u0157\u0157"
-          + "\u0159\u0159\u015B\u015B\u015D\u015D\u015F\u015F\u0161\u0161\u0163\u0163"
-          + "\u0165\u0165\u0167\u0167\u0169\u0169\u016B\u016B\u016D\u016D\u016F\u016F"
-          + "\u0171\u0171\u0173\u0173\u0175\u0175\u0177\u0177\u017A\u017A\u017C\u017C"
-          + "\u017E\u0180\u0183\u0183\u0185\u0185\u0188\u0188\u018C\u018D\u0192\u0192"
-          + "\u0195\u0195\u0199\u019B\u019E\u019E\u01A1\u01A1\u01A3\u01A3\u01A5\u01A5"
-          + "\u01A8\u01A8\u01AB\u01AB\u01AD\u01AD\u01B0\u01B0\u01B4\u01B4\u01B6\u01B6"
-          + "\u01B9\u01BA\u01BD\u01BD\u01C6\u01C6\u01C9\u01C9\u01CC\u01CC\u01CE\u01CE"
-          + "\u01D0\u01D0\u01D2\u01D2\u01D4\u01D4\u01D6\u01D6\u01D8\u01D8\u01DA\u01DA"
-          + "\u01DC\u01DD\u01DF\u01DF\u01E1\u01E1\u01E3\u01E3\u01E5\u01E5\u01E7\u01E7"
-          + "\u01E9\u01E9\u01EB\u01EB\u01ED\u01ED\u01EF\u01F0\u01F3\u01F3\u01F5\u01F5"
-          + "\u01FB\u01FB\u01FD\u01FD\u01FF\u01FF\u0201\u0201\u0203\u0203\u0205\u0205"
-          + "\u0207\u0207\u0209\u0209\u020B\u020B\u020D\u020D\u020F\u020F\u0211\u0211"
-          + "\u0213\u0213\u0215\u0215\u0217\u0217\u0250\u02A8\u0390\u0390\u03AC\u03CE"
-          + "\u03D0\u03D1\u03D5\u03D6\u03E3\u03E3\u03E5\u03E5\u03E7\u03E7\u03E9\u03E9"
-          + "\u03EB\u03EB\u03ED\u03ED\u03EF\u03F2\u0430\u044F\u0451\u045C\u045E\u045F"
-          + "\u0461\u0461\u0463\u0463\u0465\u0465\u0467\u0467\u0469\u0469\u046B\u046B"
-          + "\u046D\u046D\u046F\u046F\u0471\u0471\u0473\u0473\u0475\u0475\u0477\u0477"
-          + "\u0479\u0479\u047B\u047B\u047D\u047D\u047F\u047F\u0481\u0481\u0491\u0491"
-          + "\u0493\u0493\u0495\u0495\u0497\u0497\u0499\u0499\u049B\u049B\u049D\u049D"
-          + "\u049F\u049F\u04A1\u04A1\u04A3\u04A3\u04A5\u04A5\u04A7\u04A7\u04A9\u04A9"
-          + "\u04AB\u04AB\u04AD\u04AD\u04AF\u04AF\u04B1\u04B1\u04B3\u04B3\u04B5\u04B5"
-          + "\u04B7\u04B7\u04B9\u04B9\u04BB\u04BB\u04BD\u04BD\u04BF\u04BF\u04C2\u04C2"
-          + "\u04C4\u04C4\u04C8\u04C8\u04CC\u04CC\u04D1\u04D1\u04D3\u04D3\u04D5\u04D5"
-          + "\u04D7\u04D7\u04D9\u04D9\u04DB\u04DB\u04DD\u04DD\u04DF\u04DF\u04E1\u04E1"
-          + "\u04E3\u04E3\u04E5\u04E5\u04E7\u04E7\u04E9\u04E9\u04EB\u04EB\u04EF\u04EF"
-          + "\u04F1\u04F1\u04F3\u04F3\u04F5\u04F5\u04F9\u04F9\u0561\u0587\u10D0\u10F6"
-          + "\u1E01\u1E01\u1E03\u1E03\u1E05\u1E05\u1E07\u1E07\u1E09\u1E09\u1E0B\u1E0B"
-          + "\u1E0D\u1E0D\u1E0F\u1E0F\u1E11\u1E11\u1E13\u1E13\u1E15\u1E15\u1E17\u1E17"
-          + "\u1E19\u1E19\u1E1B\u1E1B\u1E1D\u1E1D\u1E1F\u1E1F\u1E21\u1E21\u1E23\u1E23"
-          + "\u1E25\u1E25\u1E27\u1E27\u1E29\u1E29\u1E2B\u1E2B\u1E2D\u1E2D\u1E2F\u1E2F"
-          + "\u1E31\u1E31\u1E33\u1E33\u1E35\u1E35\u1E37\u1E37\u1E39\u1E39\u1E3B\u1E3B"
-          + "\u1E3D\u1E3D\u1E3F\u1E3F\u1E41\u1E41\u1E43\u1E43\u1E45\u1E45\u1E47\u1E47"
-          + "\u1E49\u1E49\u1E4B\u1E4B\u1E4D\u1E4D\u1E4F\u1E4F\u1E51\u1E51\u1E53\u1E53"
-          + "\u1E55\u1E55\u1E57\u1E57\u1E59\u1E59\u1E5B\u1E5B\u1E5D\u1E5D\u1E5F\u1E5F"
-          + "\u1E61\u1E61\u1E63\u1E63\u1E65\u1E65\u1E67\u1E67\u1E69\u1E69\u1E6B\u1E6B"
-          + "\u1E6D\u1E6D\u1E6F\u1E6F\u1E71\u1E71\u1E73\u1E73\u1E75\u1E75\u1E77\u1E77"
-          + "\u1E79\u1E79\u1E7B\u1E7B\u1E7D\u1E7D\u1E7F\u1E7F\u1E81\u1E81\u1E83\u1E83"
-          + "\u1E85\u1E85\u1E87\u1E87\u1E89\u1E89\u1E8B\u1E8B\u1E8D\u1E8D\u1E8F\u1E8F"
-          + "\u1E91\u1E91\u1E93\u1E93\u1E95\u1E9B\u1EA1\u1EA1\u1EA3\u1EA3\u1EA5\u1EA5"
-          + "\u1EA7\u1EA7\u1EA9\u1EA9\u1EAB\u1EAB\u1EAD\u1EAD\u1EAF\u1EAF\u1EB1\u1EB1"
-          + "\u1EB3\u1EB3\u1EB5\u1EB5\u1EB7\u1EB7\u1EB9\u1EB9\u1EBB\u1EBB\u1EBD\u1EBD"
-          + "\u1EBF\u1EBF\u1EC1\u1EC1\u1EC3\u1EC3\u1EC5\u1EC5\u1EC7\u1EC7\u1EC9\u1EC9"
-          + "\u1ECB\u1ECB\u1ECD\u1ECD\u1ECF\u1ECF\u1ED1\u1ED1\u1ED3\u1ED3\u1ED5\u1ED5"
-          + "\u1ED7\u1ED7\u1ED9\u1ED9\u1EDB\u1EDB\u1EDD\u1EDD\u1EDF\u1EDF\u1EE1\u1EE1"
-          + "\u1EE3\u1EE3\u1EE5\u1EE5\u1EE7\u1EE7\u1EE9\u1EE9\u1EEB\u1EEB\u1EED\u1EED"
-          + "\u1EEF\u1EEF\u1EF1\u1EF1\u1EF3\u1EF3\u1EF5\u1EF5\u1EF7\u1EF7\u1EF9\u1EF9"
-          + "\u1F00\u1F07\u1F10\u1F15\u1F20\u1F27\u1F30\u1F37\u1F40\u1F45\u1F50\u1F57"
-          + "\u1F60\u1F67\u1F70\u1F7D\u1F80\u1F87\u1F90\u1F97\u1FA0\u1FA7\u1FB0\u1FB4"
-          + "\u1FB6\u1FB7\u1FC2\u1FC4\u1FC6\u1FC7\u1FD0\u1FD3\u1FD6\u1FD7\u1FE0\u1FE7"
-          + "\u1FF2\u1FF4\u1FF6\u1FF7\u207F\u207F\u210A\u210A\u210E\u210F\u2113\u2113"
-          + "\u212E\u212F\u2134\u2134\uFB00\uFB06\uFB13\uFB17\uFF41\uFF5A" },
-        { "Lu", "AZ\u00C0\u00D6\u00D8\u00DE\u0100\u0100\u0102\u0102\u0104\u0104\u0106\u0106"
-          + "\u0108\u0108\u010A\u010A\u010C\u010C\u010E\u010E\u0110\u0110\u0112\u0112"
-          + "\u0114\u0114\u0116\u0116\u0118\u0118\u011A\u011A\u011C\u011C\u011E\u011E"
-          + "\u0120\u0120\u0122\u0122\u0124\u0124\u0126\u0126\u0128\u0128\u012A\u012A"
-          + "\u012C\u012C\u012E\u012E\u0130\u0130\u0132\u0132\u0134\u0134\u0136\u0136"
-          + "\u0139\u0139\u013B\u013B\u013D\u013D\u013F\u013F\u0141\u0141\u0143\u0143"
-          + "\u0145\u0145\u0147\u0147\u014A\u014A\u014C\u014C\u014E\u014E\u0150\u0150"
-          + "\u0152\u0152\u0154\u0154\u0156\u0156\u0158\u0158\u015A\u015A\u015C\u015C"
-          + "\u015E\u015E\u0160\u0160\u0162\u0162\u0164\u0164\u0166\u0166\u0168\u0168"
-          + "\u016A\u016A\u016C\u016C\u016E\u016E\u0170\u0170\u0172\u0172\u0174\u0174"
-          + "\u0176\u0176\u0178\u0179\u017B\u017B\u017D\u017D\u0181\u0182\u0184\u0184"
-          + "\u0186\u0187\u0189\u018B\u018E\u0191\u0193\u0194\u0196\u0198\u019C\u019D"
-          + "\u019F\u01A0\u01A2\u01A2\u01A4\u01A4\u01A6\u01A7\u01A9\u01A9\u01AC\u01AC"
-          + "\u01AE\u01AF\u01B1\u01B3\u01B5\u01B5\u01B7\u01B8\u01BC\u01BC\u01C4\u01C4"
-          + "\u01C7\u01C7\u01CA\u01CA\u01CD\u01CD\u01CF\u01CF\u01D1\u01D1\u01D3\u01D3"
-          + "\u01D5\u01D5\u01D7\u01D7\u01D9\u01D9\u01DB\u01DB\u01DE\u01DE\u01E0\u01E0"
-          + "\u01E2\u01E2\u01E4\u01E4\u01E6\u01E6\u01E8\u01E8\u01EA\u01EA\u01EC\u01EC"
-          + "\u01EE\u01EE\u01F1\u01F1\u01F4\u01F4\u01FA\u01FA\u01FC\u01FC\u01FE\u01FE"
-          + "\u0200\u0200\u0202\u0202\u0204\u0204\u0206\u0206\u0208\u0208\u020A\u020A"
-          + "\u020C\u020C\u020E\u020E\u0210\u0210\u0212\u0212\u0214\u0214\u0216\u0216"
-          + "\u0386\u0386\u0388\u038A\u038C\u038C\u038E\u038F\u0391\u03A1\u03A3\u03AB"
-          + "\u03D2\u03D4\u03DA\u03DA\u03DC\u03DC\u03DE\u03DE\u03E0\u03E0\u03E2\u03E2"
-          + "\u03E4\u03E4\u03E6\u03E6\u03E8\u03E8\u03EA\u03EA\u03EC\u03EC\u03EE\u03EE"
-          + "\u0401\u040C\u040E\u042F\u0460\u0460\u0462\u0462\u0464\u0464\u0466\u0466"
-          + "\u0468\u0468\u046A\u046A\u046C\u046C\u046E\u046E\u0470\u0470\u0472\u0472"
-          + "\u0474\u0474\u0476\u0476\u0478\u0478\u047A\u047A\u047C\u047C\u047E\u047E"
-          + "\u0480\u0480\u0490\u0490\u0492\u0492\u0494\u0494\u0496\u0496\u0498\u0498"
-          + "\u049A\u049A\u049C\u049C\u049E\u049E\u04A0\u04A0\u04A2\u04A2\u04A4\u04A4"
-          + "\u04A6\u04A6\u04A8\u04A8\u04AA\u04AA\u04AC\u04AC\u04AE\u04AE\u04B0\u04B0"
-          + "\u04B2\u04B2\u04B4\u04B4\u04B6\u04B6\u04B8\u04B8\u04BA\u04BA\u04BC\u04BC"
-          + "\u04BE\u04BE\u04C1\u04C1\u04C3\u04C3\u04C7\u04C7\u04CB\u04CB\u04D0\u04D0"
-          + "\u04D2\u04D2\u04D4\u04D4\u04D6\u04D6\u04D8\u04D8\u04DA\u04DA\u04DC\u04DC"
-          + "\u04DE\u04DE\u04E0\u04E0\u04E2\u04E2\u04E4\u04E4\u04E6\u04E6\u04E8\u04E8"
-          + "\u04EA\u04EA\u04EE\u04EE\u04F0\u04F0\u04F2\u04F2\u04F4\u04F4\u04F8\u04F8"
-          + "\u0531\u0556\u10A0\u10C5\u1E00\u1E00\u1E02\u1E02\u1E04\u1E04\u1E06\u1E06"
-          + "\u1E08\u1E08\u1E0A\u1E0A\u1E0C\u1E0C\u1E0E\u1E0E\u1E10\u1E10\u1E12\u1E12"
-          + "\u1E14\u1E14\u1E16\u1E16\u1E18\u1E18\u1E1A\u1E1A\u1E1C\u1E1C\u1E1E\u1E1E"
-          + "\u1E20\u1E20\u1E22\u1E22\u1E24\u1E24\u1E26\u1E26\u1E28\u1E28\u1E2A\u1E2A"
-          + "\u1E2C\u1E2C\u1E2E\u1E2E\u1E30\u1E30\u1E32\u1E32\u1E34\u1E34\u1E36\u1E36"
-          + "\u1E38\u1E38\u1E3A\u1E3A\u1E3C\u1E3C\u1E3E\u1E3E\u1E40\u1E40\u1E42\u1E42"
-          + "\u1E44\u1E44\u1E46\u1E46\u1E48\u1E48\u1E4A\u1E4A\u1E4C\u1E4C\u1E4E\u1E4E"
-          + "\u1E50\u1E50\u1E52\u1E52\u1E54\u1E54\u1E56\u1E56\u1E58\u1E58\u1E5A\u1E5A"
-          + "\u1E5C\u1E5C\u1E5E\u1E5E\u1E60\u1E60\u1E62\u1E62\u1E64\u1E64\u1E66\u1E66"
-          + "\u1E68\u1E68\u1E6A\u1E6A\u1E6C\u1E6C\u1E6E\u1E6E\u1E70\u1E70\u1E72\u1E72"
-          + "\u1E74\u1E74\u1E76\u1E76\u1E78\u1E78\u1E7A\u1E7A\u1E7C\u1E7C\u1E7E\u1E7E"
-          + "\u1E80\u1E80\u1E82\u1E82\u1E84\u1E84\u1E86\u1E86\u1E88\u1E88\u1E8A\u1E8A"
-          + "\u1E8C\u1E8C\u1E8E\u1E8E\u1E90\u1E90\u1E92\u1E92\u1E94\u1E94\u1EA0\u1EA0"
-          + "\u1EA2\u1EA2\u1EA4\u1EA4\u1EA6\u1EA6\u1EA8\u1EA8\u1EAA\u1EAA\u1EAC\u1EAC"
-          + "\u1EAE\u1EAE\u1EB0\u1EB0\u1EB2\u1EB2\u1EB4\u1EB4\u1EB6\u1EB6\u1EB8\u1EB8"
-          + "\u1EBA\u1EBA\u1EBC\u1EBC\u1EBE\u1EBE\u1EC0\u1EC0\u1EC2\u1EC2\u1EC4\u1EC4"
-          + "\u1EC6\u1EC6\u1EC8\u1EC8\u1ECA\u1ECA\u1ECC\u1ECC\u1ECE\u1ECE\u1ED0\u1ED0"
-          + "\u1ED2\u1ED2\u1ED4\u1ED4\u1ED6\u1ED6\u1ED8\u1ED8\u1EDA\u1EDA\u1EDC\u1EDC"
-          + "\u1EDE\u1EDE\u1EE0\u1EE0\u1EE2\u1EE2\u1EE4\u1EE4\u1EE6\u1EE6\u1EE8\u1EE8"
-          + "\u1EEA\u1EEA\u1EEC\u1EEC\u1EEE\u1EEE\u1EF0\u1EF0\u1EF2\u1EF2\u1EF4\u1EF4"
-          + "\u1EF6\u1EF6\u1EF8\u1EF8\u1F08\u1F0F\u1F18\u1F1D\u1F28\u1F2F\u1F38\u1F3F"
-          + "\u1F48\u1F4D\u1F59\u1F59\u1F5B\u1F5B\u1F5D\u1F5D\u1F5F\u1F5F\u1F68\u1F6F"
-          + "\u1F88\u1F8F\u1F98\u1F9F\u1FA8\u1FAF\u1FB8\u1FBC\u1FBE\u1FBE\u1FC8\u1FCC"
-          + "\u1FD8\u1FDB\u1FE8\u1FEC\u1FF8\u1FFC\u2102\u2102\u2107\u2107\u210B\u210D"
-          + "\u2110\u2112\u2115\u2115\u2118\u211D\u2124\u2124\u2126\u2126\u2128\u2128"
-          + "\u212A\u212D\u2130\u2131\u2133\u2133\uFF21\uFF3A" },
-        { "Lt", "\u01C5\u01C5\u01C8\u01C8\u01CB\u01CB\u01F2\u01F2" },
-        { "Lo", "\u01AA\u01AA\u01BB\u01BB\u01BE\u01C3\u03F3\u03F3\u04C0\u04C0\u05D0\u05EA"
-          + "\u05F0\u05F2\u0621\u063A\u0641\u064A\u0671\u06B7\u06BA\u06BE\u06C0\u06CE"
-          + "\u06D0\u06D3\u06D5\u06D5\u0905\u0939\u093D\u093D\u0958\u0961\u0985\u098C"
-          + "\u098F\u0990\u0993\u09A8\u09AA\u09B0\u09B2\u09B2\u09B6\u09B9\u09DC\u09DD"
-          + "\u09DF\u09E1\u09F0\u09F1\u0A05\u0A0A\u0A0F\u0A10\u0A13\u0A28\u0A2A\u0A30"
-          + "\u0A32\u0A33\u0A35\u0A36\u0A38\u0A39\u0A59\u0A5C\u0A5E\u0A5E\u0A72\u0A74"
-          + "\u0A85\u0A8B\u0A8D\u0A8D\u0A8F\u0A91\u0A93\u0AA8\u0AAA\u0AB0\u0AB2\u0AB3"
-          + "\u0AB5\u0AB9\u0ABD\u0ABD\u0AE0\u0AE0\u0B05\u0B0C\u0B0F\u0B10\u0B13\u0B28"
-          + "\u0B2A\u0B30\u0B32\u0B33\u0B36\u0B39\u0B3D\u0B3D\u0B5C\u0B5D\u0B5F\u0B61"
-          + "\u0B85\u0B8A\u0B8E\u0B90\u0B92\u0B95\u0B99\u0B9A\u0B9C\u0B9C\u0B9E\u0B9F"
-          + "\u0BA3\u0BA4\u0BA8\u0BAA\u0BAE\u0BB5\u0BB7\u0BB9\u0C05\u0C0C\u0C0E\u0C10"
-          + "\u0C12\u0C28\u0C2A\u0C33\u0C35\u0C39\u0C60\u0C61\u0C85\u0C8C\u0C8E\u0C90"
-          + "\u0C92\u0CA8\u0CAA\u0CB3\u0CB5\u0CB9\u0CDE\u0CDE\u0CE0\u0CE1\u0D05\u0D0C"
-          + "\u0D0E\u0D10\u0D12\u0D28\u0D2A\u0D39\u0D60\u0D61\u0E01\u0E2E\u0E30\u0E30"
-          + "\u0E32\u0E33\u0E40\u0E45\u0E81\u0E82\u0E84\u0E84\u0E87\u0E88\u0E8A\u0E8A"
-          + "\u0E8D\u0E8D\u0E94\u0E97\u0E99\u0E9F\u0EA1\u0EA3\u0EA5\u0EA5\u0EA7\u0EA7"
-          + "\u0EAA\u0EAB\u0EAD\u0EAE\u0EB0\u0EB0\u0EB2\u0EB3\u0EBD\u0EBD\u0EC0\u0EC4"
-          + "\u0EDC\u0EDD\u0F40\u0F47\u0F49\u0F69\u1100\u1159\u115F\u11A2\u11A8\u11F9"
-          + "\u2135\u2138\u3041\u3094\u30A1\u30FA\u3105\u312C\u3131\u318E\u4E00\u9FA5"
-          + "\uAC00\uD7A3\uF900\uFA2D\uFB1F\uFB28\uFB2A\uFB36\uFB38\uFB3C\uFB3E\uFB3E"
-          + "\uFB40\uFB41\uFB43\uFB44\uFB46\uFBB1\uFBD3\uFD3D\uFD50\uFD8F\uFD92\uFDC7"
-          + "\uFDF0\uFDFB\uFE70\uFE72\uFE74\uFE74\uFE76\uFEFC\uFF66\uFF6F\uFF71\uFF9D"
-          + "\uFFA0\uFFBE\uFFC2\uFFC7\uFFCA\uFFCF\uFFD2\uFFD7\uFFDA\uFFDC" },
-        { "Lm", "\u02B0\u02B8\u02BB\u02C1\u02D0\u02D1\u02E0\u02E4\u037A\u037A\u0559\u0559"
-          + "\u0640\u0640\u06E5\u06E6\u0E46\u0E46\u0EC6\u0EC6\u3005\u3005\u3031\u3035"
-          + "\u309B\u309E\u30FC\u30FE\uFF70\uFF70\uFF9E\uFF9F" },
-        { "Nd", "09\u0660\u0669\u06F0\u06F9\u0966\u096F\u09E6\u09EF\u0A66\u0A6F\u0AE6\u0AEF"
-          + "\u0B66\u0B6F\u0BE7\u0BEF\u0C66\u0C6F\u0CE6\u0CEF\u0D66\u0D6F\u0E50\u0E59"
-          + "\u0ED0\u0ED9\u0F20\u0F29\uFF10\uFF19" },
-        { "Nl", "\u2160\u2182\u3007\u3007\u3021\u3029" },
-        { "No", "\u00B2\u00B3\u00B9\u00B9\u00BC\u00BE\u09F4\u09F9\u0BF0\u0BF2\u0F2A\u0F33"
-          + "\u2070\u2070\u2074\u2079\u2080\u2089\u2153\u215F\u2460\u249B\u24EA\u24EA"
-          + "\u2776\u2793\u3192\u3195\u3220\u3229\u3280\u3289" },
-        { "Ps", "(([[{{\u00AB\u00AB\u0F3A\u0F3A\u0F3C\u0F3C\u2018\u2018\u201A"
-          + "\u201C\u201E\u201F\u2039\u2039\u2045\u2045\u207D\u207D\u208D\u208D\u2329"
-          + "\u2329\u3008\u3008\u300A\u300A\u300C\u300C\u300E\u300E\u3010\u3010\u3014"
-          + "\u3014\u3016\u3016\u3018\u3018\u301A\u301A\u301D\u301D\u301F\u301F\uFD3E"
-          + "\uFD3E\uFE35\uFE35\uFE37\uFE37\uFE39\uFE39\uFE3B\uFE3B\uFE3D\uFE3D\uFE3F"
-          + "\uFE3F\uFE41\uFE41\uFE43\uFE43\uFE59\uFE59\uFE5B\uFE5B\uFE5D\uFE5D\uFF08"
-          + "\uFF08\uFF3B\uFF3B\uFF5B\uFF5B\uFF62\uFF62" },
-        { "Pe", "))]]}}\u00BB\u00BB\u0F3B\u0F3B\u0F3D\u0F3D\u2019\u2019\u201D\u201D\u203A"
-          + "\u203A\u2046\u2046\u207E\u207E\u208E\u208E\u232A\u232A\u3009\u3009\u300B"
-          + "\u300B\u300D\u300D\u300F\u300F\u3011\u3011\u3015\u3015\u3017\u3017\u3019"
-          + "\u3019\u301B\u301B\u301E\u301E\uFD3F\uFD3F\uFE36\uFE36\uFE38\uFE38\uFE3A"
-          + "\uFE3A\uFE3C\uFE3C\uFE3E\uFE3E\uFE40\uFE40\uFE42\uFE42\uFE44\uFE44\uFE5A"
-          + "\uFE5A\uFE5C\uFE5C\uFE5E\uFE5E\uFF09\uFF09\uFF3D\uFF3D\uFF5D\uFF5D\uFF63"
-          + "\uFF63" },
-        { "Pd", "--\u00AD\u00AD\u2010\u2015\u301C\u301C\u3030\u3030\uFE31\uFE32\uFE58\uFE58"
-          + "\uFE63\uFE63\uFF0D\uFF0D" },
-        { "Pc", "__\u203F\u2040\uFE33\uFE34\uFE4D\uFE4F\uFF3F\uFF3F" },
-        { "Po", "!#%'**,,./:;?@\\\\\u00A1\u00A1\u00B7\u00B7\u00BF\u00BF\u0374\u0375\u037E"
-          + "\u037E\u0387\u0387\u055A\u055F\u0589\u0589\u05BE\u05BE\u05C0\u05C0\u05C3"
-          + "\u05C3\u05F3\u05F4\u060C\u060C\u061B\u061B\u061F\u061F\u066A\u066D\u06D4"
-          + "\u06D4\u0964\u0965\u0970\u0970\u0E2F\u0E2F\u0E5A\u0E5B\u0EAF\u0EAF\u0F04"
-          + "\u0F12\u0F85\u0F85\u10FB\u10FB\u2016\u2017\u2020\u2027\u2030\u2038\u203B"
-          + "\u203E\u2041\u2043\u3001\u3003\u3006\u3006\u30FB\u30FB\uFE30\uFE30\uFE49"
-          + "\uFE4C\uFE50\uFE52\uFE54\uFE57\uFE5F\uFE61\uFE68\uFE68\uFE6A\uFE6B\uFF01"
-          + "\uFF03\uFF05\uFF07\uFF0A\uFF0A\uFF0C\uFF0C\uFF0E\uFF0F\uFF1A\uFF1B\uFF1F"
-          + "\uFF20\uFF3C\uFF3C\uFF61\uFF61\uFF64\uFF65" },
-        { "Sc", "$$\u00A2\u00A5\u09F2\u09F3\u0E3F\u0E3F\u20A0\u20AB\uFE69\uFE69\uFF04\uFF04"
-          + "\uFFE0\uFFE1\uFFE5\uFFE6" },
-        { "Sm", "++<>||~~\u00AC\u00AC\u00B1\u00B1\u00D7\u00D7\u00F7\u00F7\u2044\u2044\u207A"
-          + "\u207C\u208A\u208C\u2190\u2194\u21D2\u21D2\u21D4\u21D4\u2200\u22F1\u2308"
-          + "\u230B\u2320\u2321\uFB29\uFB29\uFE62\uFE62\uFE64\uFE66\uFF0B\uFF0B\uFF1C"
-          + "\uFF1E\uFF5C\uFF5C\uFF5E\uFF5E\uFFE2\uFFE2\uFFE8\uFFEC" },
-        { "So", "\u00A6\u00A7\u00A9\u00A9\u00AE\u00AE\u00B0\u00B0\u00B6\u00B6\u0482\u0482"
-          + "\u06E9\u06E9\u0950\u0950\u09FA\u09FA\u0AD0\u0AD0\u0B70\u0B70\u0E4F\u0E4F"
-          + "\u0F00\u0F03\u0F13\u0F17\u0F1A\u0F1F\u0F34\u0F34\u0F36\u0F36\u0F38\u0F38"
-          + "\u2100\u2101\u2103\u2106\u2108\u2109\u2114\u2114\u2116\u2117\u211E\u2123"
-          + "\u2125\u2125\u2127\u2127\u2129\u2129\u2132\u2132\u2195\u21D1\u21D3\u21D3"
-          + "\u21D5\u21EA\u2300\u2300\u2302\u2307\u230C\u231F\u2322\u2328\u232B\u237A"
-          + "\u2400\u2424\u2440\u244A\u249C\u24E9\u2500\u2595\u25A0\u25EF\u2600\u2613"
-          + "\u261A\u266F\u2701\u2704\u2706\u2709\u270C\u2727\u2729\u274B\u274D\u274D"
-          + "\u274F\u2752\u2756\u2756\u2758\u275E\u2761\u2767\u2794\u2794\u2798\u27AF"
-          + "\u27B1\u27BE\u3004\u3004\u3012\u3013\u3020\u3020\u3036\u3037\u303F\u303F"
-          + "\u3190\u3191\u3196\u319F\u3200\u321C\u322A\u3243\u3260\u327B\u327F\u327F"
-          + "\u328A\u32B0\u32C0\u32CB\u32D0\u32FE\u3300\u3376\u337B\u33DD\u33E0\u33FE"
-          + "\uFFE4\uFFE4\uFFED\uFFEE\uFFFD\uFFFD" },
-        { "Mn", "\u0300\u0345\u0360\u0361\u0483\u0486\u0591\u05A1\u05A3\u05B9\u05BB\u05BD"
-          + "\u05BF\u05BF\u05C1\u05C2\u05C4\u05C4\u064B\u0652\u0670\u0670\u06D6\u06DC"
-          + "\u06DF\u06E4\u06E7\u06E8\u06EA\u06ED\u0901\u0902\u093C\u093C\u0941\u0948"
-          + "\u094D\u094D\u0951\u0954\u0962\u0963\u0981\u0981\u09BC\u09BC\u09C1\u09C4"
-          + "\u09CD\u09CD\u09E2\u09E3\u0A02\u0A02\u0A3C\u0A3C\u0A41\u0A42\u0A47\u0A48"
-          + "\u0A4B\u0A4D\u0A70\u0A71\u0A81\u0A82\u0ABC\u0ABC\u0AC1\u0AC5\u0AC7\u0AC8"
-          + "\u0ACD\u0ACD\u0B01\u0B01\u0B3C\u0B3C\u0B3F\u0B3F\u0B41\u0B43\u0B4D\u0B4D"
-          + "\u0B56\u0B56\u0B82\u0B82\u0BC0\u0BC0\u0BCD\u0BCD\u0C3E\u0C40\u0C46\u0C48"
-          + "\u0C4A\u0C4D\u0C55\u0C56\u0CBF\u0CBF\u0CC6\u0CC6\u0CCC\u0CCD\u0D41\u0D43"
-          + "\u0D4D\u0D4D\u0E31\u0E31\u0E34\u0E3A\u0E47\u0E4E\u0EB1\u0EB1\u0EB4\u0EB9"
-          + "\u0EBB\u0EBC\u0EC8\u0ECD\u0F18\u0F19\u0F35\u0F35\u0F37\u0F37\u0F39\u0F39"
-          + "\u0F71\u0F7E\u0F80\u0F84\u0F86\u0F8B\u0F90\u0F95\u0F97\u0F97\u0F99\u0FAD"
-          + "\u0FB1\u0FB7\u0FB9\u0FB9\u20D0\u20DC\u20E1\u20E1\u302A\u302F\u3099\u309A"
-          + "\uFB1E\uFB1E\uFE20\uFE23" },
-        { "Mc", "\u0903\u0903\u093E\u0940\u0949\u094C\u0982\u0983\u09BE\u09C0\u09C7\u09C8"
-          + "\u09CB\u09CC\u09D7\u09D7\u0A3E\u0A40\u0A83\u0A83\u0ABE\u0AC0\u0AC9\u0AC9"
-          + "\u0ACB\u0ACC\u0B02\u0B03\u0B3E\u0B3E\u0B40\u0B40\u0B47\u0B48\u0B4B\u0B4C"
-          + "\u0B57\u0B57\u0B83\u0B83\u0BBE\u0BBF\u0BC1\u0BC2\u0BC6\u0BC8\u0BCA\u0BCC"
-          + "\u0BD7\u0BD7\u0C01\u0C03\u0C41\u0C44\u0C82\u0C83\u0CBE\u0CBE\u0CC0\u0CC4"
-          + "\u0CC7\u0CC8\u0CCA\u0CCB\u0CD5\u0CD6\u0D02\u0D03\u0D3E\u0D40\u0D46\u0D48"
-          + "\u0D4A\u0D4C\u0D57\u0D57\u0F3E\u0F3F\u0F7F\u0F7F" },
-        { "Me", "\u06DD\u06DE\u20DD\u20E0" },
-        { "Zl", "\u2028\u2028" },
-        { "Zp", "\u2029\u2029" },
-        { "Zs", "\u0020\u0020\u00A0\u00A0\u2000\u200B\u3000\u3000" },
-        { "Cc", "\u0000\u001F\u007F\u009F" },
-        { "Cf", "\u200C\u200F\u202A\u202E\u206A\u206F\uFEFF\uFEFF" }
-    };
-}