2003-02-26 00:35:09 +00:00
|
|
|
/**
|
|
|
|
*******************************************************************************
|
|
|
|
* Copyright (C) 1996-2001, International Business Machines Corporation and *
|
|
|
|
* others. All Rights Reserved. *
|
|
|
|
*******************************************************************************
|
|
|
|
*
|
|
|
|
* $Source: /xsrl/Nsvn/icu/unicodetools/com/ibm/text/UCD/GenerateStandardizedVariants.java,v $
|
2004-02-12 08:23:19 +00:00
|
|
|
* $Date: 2004/02/12 08:23:15 $
|
|
|
|
* $Revision: 1.5 $
|
2003-02-26 00:35:09 +00:00
|
|
|
*
|
|
|
|
*******************************************************************************
|
|
|
|
*/
|
|
|
|
|
|
|
|
package com.ibm.text.UCD;
|
|
|
|
import com.ibm.text.utility.*;
|
|
|
|
import com.ibm.icu.text.UTF16;
|
|
|
|
import com.ibm.icu.text.UnicodeSet;
|
|
|
|
import java.util.*;
|
|
|
|
import java.io.*;
|
|
|
|
|
|
|
|
public final class GenerateStandardizedVariants implements UCD_Types {
|
|
|
|
|
2003-03-12 16:01:26 +00:00
|
|
|
static final boolean DEBUG = false;
|
|
|
|
|
|
|
|
static public String showVarGlyphs(String code0, String code1, String shape, String description) {
|
|
|
|
if (DEBUG) System.out.println(code0 + ", " + code1 + ", [" + shape + "]");
|
2003-02-26 00:35:09 +00:00
|
|
|
|
|
|
|
String abbShape = "";
|
|
|
|
if (shape.length() != 0) {
|
|
|
|
abbShape = '-' + shape.substring(0,4);
|
2003-03-12 16:01:26 +00:00
|
|
|
if (description.indexOf("feminine") >= 0) abbShape += "fem";
|
2003-02-26 00:35:09 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
return "<img alt='U+" + code0 + "+U+" + code1 + "/" + shape
|
|
|
|
+ "' src='http://www.unicode.org/cgi-bin/varglyph?24-" +code0 + "-" + code1 + abbShape + "'>";
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
# Field 0: the variation sequence
|
|
|
|
# Field 1: the description of the desired appearance
|
|
|
|
# Field 2: where the appearance is only different in in particular shaping environments
|
|
|
|
# this field lists them. The possible values are: isolated, initial, medial, final.
|
|
|
|
# If more than one is present, there are spaces between them.
|
|
|
|
*/
|
|
|
|
static public void generate() throws IOException {
|
2004-02-07 01:01:17 +00:00
|
|
|
|
2003-02-26 00:35:09 +00:00
|
|
|
|
|
|
|
// read the data and compose the table
|
|
|
|
|
|
|
|
String table = "<table><tr><th>Rep Glyph</th><th>Character Sequence</th><th>Context</th><th width='10%'>Alt Glyph</th><th>Description of variant appearance</th></tr>";
|
|
|
|
|
|
|
|
String[] splits = new String[4];
|
|
|
|
String[] codes = new String[2];
|
|
|
|
String[] shapes = new String[4];
|
|
|
|
|
2004-02-07 01:01:17 +00:00
|
|
|
BufferedReader in = Utility.openUnicodeFile("StandardizedVariants", Default.ucdVersion(), true, Utility.LATIN1);
|
2003-02-26 00:35:09 +00:00
|
|
|
while (true) {
|
|
|
|
String line = Utility.readDataLine(in);
|
|
|
|
if (line == null) break;
|
|
|
|
if (line.length() == 0) continue;
|
|
|
|
|
|
|
|
int count = Utility.split(line, ';', splits);
|
|
|
|
int codeCount = Utility.split(splits[0], ' ', codes);
|
|
|
|
int code = Utility.codePointFromHex(codes[0]);
|
|
|
|
|
|
|
|
// <img alt="03E2" src="http://www.unicode.org/cgi-bin/refglyph?24-03E2" style="vertical-align:middle">
|
|
|
|
|
|
|
|
table += "<tr><td><img alt='U+" + codes[0] + "' src='http://www.unicode.org/cgi-bin/refglyph?24-" + codes[0] + "'></td>\n";
|
|
|
|
table += "<td>" + splits[0] + "</td>\n";
|
|
|
|
|
|
|
|
String shape = splits[2].trim();
|
|
|
|
if (shape.equals("all")) shape = "";
|
|
|
|
|
|
|
|
table += "<td>" + Utility.replace(shape, " ", "<br>") + "</td>\n";
|
|
|
|
|
|
|
|
// http://www.unicode.org/cgi-bin/varglyph?24-1820-180B-fina
|
|
|
|
// http://www.unicode.org/cgi-bin/varglyph?24-222A-FE00
|
|
|
|
|
|
|
|
table += "<td>";
|
|
|
|
if (shape.length() == 0) {
|
2003-03-12 16:01:26 +00:00
|
|
|
table += showVarGlyphs(codes[0], codes[1], "", "");
|
2003-02-26 00:35:09 +00:00
|
|
|
} else {
|
|
|
|
int shapeCount = Utility.split(shape, ' ', shapes);
|
|
|
|
for (int i = 0; i < shapeCount; ++i) {
|
|
|
|
if (i != 0) table += " ";
|
2003-03-12 16:01:26 +00:00
|
|
|
table += showVarGlyphs(codes[0], codes[1], shapes[i], splits[1]);
|
2003-02-26 00:35:09 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
table += "</td>\n";
|
|
|
|
|
2004-02-07 01:01:17 +00:00
|
|
|
table += "<td>" + Default.ucd().getName(code) + " " + splits[1] + "</td>\n";
|
2003-02-26 00:35:09 +00:00
|
|
|
table += "</tr>";
|
|
|
|
}
|
|
|
|
in.close();
|
|
|
|
table += "</table>";
|
|
|
|
|
|
|
|
// now write out the results
|
|
|
|
|
|
|
|
String directory = "DerivedData/";
|
2004-02-12 08:23:19 +00:00
|
|
|
String filename = directory + "StandardizedVariants" + UnicodeDataFile.getHTMLFileSuffix(true);
|
2003-02-26 00:35:09 +00:00
|
|
|
PrintWriter out = Utility.openPrintWriter(filename, Utility.LATIN1_UNIX);
|
|
|
|
String[] batName = {""};
|
2004-02-12 08:23:19 +00:00
|
|
|
String mostRecent = UnicodeDataFile.generateBat(directory, filename, UnicodeDataFile.getFileSuffix(true), batName);
|
2003-02-26 00:35:09 +00:00
|
|
|
|
2004-02-07 01:01:17 +00:00
|
|
|
String version = Default.ucd().getVersion();
|
2003-03-12 16:01:26 +00:00
|
|
|
int lastDot = version.lastIndexOf('.');
|
|
|
|
String updateDirectory = version.substring(0,lastDot) + "-Update";
|
|
|
|
int updateV = version.charAt(version.length()-1) - '0';
|
|
|
|
if (updateV != 0) updateDirectory += (char)('1' + updateV);
|
|
|
|
if (DEBUG) System.out.println("updateDirectory: " + updateDirectory);
|
|
|
|
|
2003-02-26 00:35:09 +00:00
|
|
|
String[] replacementList = {
|
2004-02-07 01:01:17 +00:00
|
|
|
"@revision@", Default.ucd().getVersion(),
|
2003-03-12 16:01:26 +00:00
|
|
|
"@updateDirectory@", updateDirectory,
|
2003-02-26 00:35:09 +00:00
|
|
|
"@date@", Default.getDate(),
|
|
|
|
"@table@", table};
|
|
|
|
|
|
|
|
Utility.appendFile("StandardizedVariants-Template.html", Utility.UTF8, out, replacementList);
|
|
|
|
|
|
|
|
out.close();
|
|
|
|
Utility.renameIdentical(mostRecent, Utility.getOutputName(filename), batName[0]);
|
|
|
|
}
|
|
|
|
}
|