2017-10-03 02:32:50 +00:00
|
|
|
// © 2017 and later: Unicode, Inc. and others.
|
|
|
|
// License & terms of use: http://www.unicode.org/copyright.html
|
1999-12-10 01:44:19 +00:00
|
|
|
/*
|
|
|
|
*******************************************************************************
|
1999-12-13 22:25:50 +00:00
|
|
|
*
|
2012-01-03 23:20:55 +00:00
|
|
|
* Copyright (C) 1999-2012, International Business Machines
|
1999-12-13 22:25:50 +00:00
|
|
|
* Corporation and others. All Rights Reserved.
|
|
|
|
*
|
1999-12-10 01:44:19 +00:00
|
|
|
*******************************************************************************
|
2010-07-27 23:32:04 +00:00
|
|
|
* file name: genprops.cpp
|
1999-12-10 01:44:19 +00:00
|
|
|
* encoding: US-ASCII
|
|
|
|
* tab size: 8 (not used)
|
|
|
|
* indentation:4
|
|
|
|
*
|
|
|
|
* created on: 1999dec08
|
|
|
|
* created by: Markus W. Scherer
|
|
|
|
*
|
2011-12-18 06:53:54 +00:00
|
|
|
* This program parses the ppucd.txt preparsed Unicode Character Database file
|
|
|
|
* and writes several source and binary files into the ICU source tree.
|
1999-12-10 01:44:19 +00:00
|
|
|
*/
|
|
|
|
|
|
|
|
#include <stdio.h>
|
|
|
|
#include <stdlib.h>
|
1999-12-28 23:57:50 +00:00
|
|
|
#include "unicode/utypes.h"
|
2011-12-16 06:51:58 +00:00
|
|
|
#include "unicode/localpointer.h"
|
|
|
|
#include "unicode/uniset.h"
|
|
|
|
#include "unicode/unistr.h"
|
|
|
|
#include "charstr.h"
|
|
|
|
#include "genprops.h"
|
|
|
|
#include "ppucd.h"
|
|
|
|
#include "toolutil.h"
|
2000-04-18 16:56:02 +00:00
|
|
|
#include "uoptions.h"
|
1999-12-10 01:44:19 +00:00
|
|
|
|
2010-07-27 23:32:04 +00:00
|
|
|
U_NAMESPACE_USE
|
|
|
|
|
2011-12-18 00:37:18 +00:00
|
|
|
UBool beVerbose=FALSE;
|
2012-01-03 23:20:55 +00:00
|
|
|
UBool beQuiet=FALSE;
|
1999-12-10 01:44:19 +00:00
|
|
|
|
2011-12-19 01:49:34 +00:00
|
|
|
PropsBuilder::PropsBuilder() {}
|
|
|
|
PropsBuilder::~PropsBuilder() {}
|
|
|
|
void PropsBuilder::setUnicodeVersion(const UVersionInfo) {}
|
2012-01-03 23:20:55 +00:00
|
|
|
void PropsBuilder::setAlgNamesRange(UChar32, UChar32,
|
|
|
|
const char *, const char *, UErrorCode &) {}
|
2011-12-19 01:49:34 +00:00
|
|
|
void PropsBuilder::setProps(const UniProps &, const UnicodeSet &, UErrorCode &) {}
|
|
|
|
void PropsBuilder::build(UErrorCode &) {}
|
|
|
|
void PropsBuilder::writeCSourceFile(const char *, UErrorCode &) {}
|
|
|
|
void PropsBuilder::writeBinaryData(const char *, UBool, UErrorCode &) {}
|
2011-12-16 06:51:58 +00:00
|
|
|
|
2011-12-18 03:21:54 +00:00
|
|
|
enum {
|
2003-08-26 17:41:02 +00:00
|
|
|
HELP_H,
|
|
|
|
HELP_QUESTION_MARK,
|
|
|
|
VERBOSE,
|
2012-01-03 23:20:55 +00:00
|
|
|
QUIET,
|
2011-12-18 06:53:54 +00:00
|
|
|
COPYRIGHT
|
2003-08-26 17:41:02 +00:00
|
|
|
};
|
|
|
|
|
|
|
|
/* Keep these values in sync with the above enums */
|
2000-04-18 16:56:02 +00:00
|
|
|
static UOption options[]={
|
|
|
|
UOPTION_HELP_H,
|
|
|
|
UOPTION_HELP_QUESTION_MARK,
|
|
|
|
UOPTION_VERBOSE,
|
2012-01-03 23:20:55 +00:00
|
|
|
UOPTION_QUIET,
|
2011-12-18 06:53:54 +00:00
|
|
|
UOPTION_COPYRIGHT
|
2000-04-18 16:56:02 +00:00
|
|
|
};
|
1999-12-10 01:44:19 +00:00
|
|
|
|
2000-04-18 16:56:02 +00:00
|
|
|
extern int
|
2000-09-21 21:49:32 +00:00
|
|
|
main(int argc, char* argv[]) {
|
2002-03-15 23:41:40 +00:00
|
|
|
U_MAIN_INIT_ARGS(argc, argv);
|
2011-12-18 00:37:18 +00:00
|
|
|
argc=u_parseArgs(argc, argv, LENGTHOF(options), options);
|
2000-04-18 16:56:02 +00:00
|
|
|
|
|
|
|
/* error handling, printing usage message */
|
|
|
|
if(argc<0) {
|
1999-12-10 01:44:19 +00:00
|
|
|
fprintf(stderr,
|
2000-04-18 16:56:02 +00:00
|
|
|
"error in command line argument \"%s\"\n",
|
|
|
|
argv[-argc]);
|
|
|
|
}
|
2011-12-18 00:37:18 +00:00
|
|
|
if(argc<2 || options[HELP_H].doesOccur || options[HELP_QUESTION_MARK].doesOccur) {
|
2001-11-20 03:27:44 +00:00
|
|
|
/*
|
2011-12-18 00:37:18 +00:00
|
|
|
* Broken into chunks because the C89 standard says the minimum
|
2001-11-20 03:27:44 +00:00
|
|
|
* required supported string length is 509 bytes.
|
|
|
|
*/
|
2000-04-18 16:56:02 +00:00
|
|
|
fprintf(stderr,
|
2011-12-18 00:37:18 +00:00
|
|
|
"Usage: %s [-options] path/to/ICU/src/root\n"
|
2001-11-20 03:27:44 +00:00
|
|
|
"\n"
|
2011-12-18 00:37:18 +00:00
|
|
|
"Reads the preparsed UCD file path/to/ICU/src/root/source/data/unidata/ppucd.txt and\n"
|
|
|
|
"writes source and binary data files with the character properties.\n"
|
|
|
|
"(UCD=Unicode Character Database)\n"
|
2001-11-20 03:27:44 +00:00
|
|
|
"\n",
|
1999-12-10 01:44:19 +00:00
|
|
|
argv[0]);
|
2001-11-20 03:27:44 +00:00
|
|
|
fprintf(stderr,
|
|
|
|
"Options:\n"
|
|
|
|
"\t-h or -? or --help this usage text\n"
|
|
|
|
"\t-v or --verbose verbose output\n"
|
2012-01-03 23:20:55 +00:00
|
|
|
"\t-q or --quiet no output\n"
|
2011-12-18 00:37:18 +00:00
|
|
|
"\t-c or --copyright include a copyright notice\n");
|
|
|
|
return argc<2 ? U_ILLEGAL_ARGUMENT_ERROR : U_ZERO_ERROR;
|
1999-12-10 01:44:19 +00:00
|
|
|
}
|
|
|
|
|
2000-04-18 16:56:02 +00:00
|
|
|
/* get the options values */
|
2003-08-26 17:41:02 +00:00
|
|
|
beVerbose=options[VERBOSE].doesOccur;
|
2012-01-03 23:20:55 +00:00
|
|
|
beQuiet=options[QUIET].doesOccur;
|
1999-12-10 01:44:19 +00:00
|
|
|
|
2011-12-16 06:51:58 +00:00
|
|
|
/* initialize */
|
|
|
|
IcuToolErrorCode errorCode("genprops");
|
2011-12-19 01:49:34 +00:00
|
|
|
LocalPointer<PNamesBuilder> pnamesBuilder(createPNamesBuilder(errorCode));
|
|
|
|
LocalPointer<PropsBuilder> corePropsBuilder(createCorePropsBuilder(errorCode));
|
2011-12-25 01:25:50 +00:00
|
|
|
LocalPointer<PropsBuilder> bidiPropsBuilder(createBiDiPropsBuilder(errorCode));
|
2012-01-10 07:23:44 +00:00
|
|
|
LocalPointer<PropsBuilder> casePropsBuilder(createCasePropsBuilder(errorCode));
|
2012-01-03 23:20:55 +00:00
|
|
|
LocalPointer<PropsBuilder> namesPropsBuilder(createNamesPropsBuilder(errorCode));
|
2011-12-16 06:51:58 +00:00
|
|
|
if(errorCode.isFailure()) {
|
2011-12-19 01:49:34 +00:00
|
|
|
fprintf(stderr, "genprops: unable to create PropsBuilders - %s\n", errorCode.errorName());
|
2011-12-16 06:51:58 +00:00
|
|
|
return errorCode.reset();
|
|
|
|
}
|
|
|
|
|
2011-12-18 00:37:18 +00:00
|
|
|
CharString icuSrcRoot(argv[1], errorCode);
|
|
|
|
|
|
|
|
CharString icuSource(icuSrcRoot, errorCode);
|
|
|
|
icuSource.appendPathPart("source", errorCode);
|
|
|
|
|
|
|
|
CharString icuSourceData(icuSource, errorCode);
|
|
|
|
icuSourceData.appendPathPart("data", errorCode);
|
|
|
|
|
|
|
|
CharString ppucdPath(icuSourceData, errorCode);
|
|
|
|
ppucdPath.appendPathPart("unidata", errorCode);
|
2011-12-16 06:51:58 +00:00
|
|
|
ppucdPath.appendPathPart("ppucd.txt", errorCode);
|
|
|
|
|
|
|
|
PreparsedUCD ppucd(ppucdPath.data(), errorCode);
|
|
|
|
if(errorCode.isFailure()) {
|
|
|
|
fprintf(stderr, "genprops: unable to open %s - %s\n",
|
|
|
|
ppucdPath.data(), errorCode.errorName());
|
|
|
|
return errorCode.reset();
|
|
|
|
}
|
2011-12-18 21:33:57 +00:00
|
|
|
|
2011-12-19 01:49:34 +00:00
|
|
|
// The PNamesBuilder uses preparsed pnames_data.h.
|
|
|
|
pnamesBuilder->build(errorCode);
|
2011-12-18 21:33:57 +00:00
|
|
|
if(U_FAILURE(errorCode)) {
|
2011-12-19 01:49:34 +00:00
|
|
|
fprintf(stderr, "genprops: PNamesBuilder::build() failed - %s\n",
|
2011-12-18 21:33:57 +00:00
|
|
|
errorCode.errorName());
|
|
|
|
return errorCode.reset();
|
|
|
|
}
|
2011-12-19 01:49:34 +00:00
|
|
|
ppucd.setPropertyNames(pnamesBuilder->getPropertyNames());
|
2011-12-18 21:33:57 +00:00
|
|
|
|
2011-12-16 06:51:58 +00:00
|
|
|
PreparsedUCD::LineType lineType;
|
|
|
|
UnicodeSet newValues;
|
|
|
|
while((lineType=ppucd.readLine(errorCode))!=PreparsedUCD::NO_LINE) {
|
|
|
|
if(ppucd.lineHasPropertyValues()) {
|
|
|
|
const UniProps *props=ppucd.getProps(newValues, errorCode);
|
2011-12-19 01:49:34 +00:00
|
|
|
corePropsBuilder->setProps(*props, newValues, errorCode);
|
2011-12-25 01:25:50 +00:00
|
|
|
bidiPropsBuilder->setProps(*props, newValues, errorCode);
|
2012-01-10 07:23:44 +00:00
|
|
|
casePropsBuilder->setProps(*props, newValues, errorCode);
|
2012-01-03 23:20:55 +00:00
|
|
|
namesPropsBuilder->setProps(*props, newValues, errorCode);
|
2011-12-16 06:51:58 +00:00
|
|
|
} else if(lineType==PreparsedUCD::UNICODE_VERSION_LINE) {
|
|
|
|
const UVersionInfo &version=ppucd.getUnicodeVersion();
|
2011-12-19 01:49:34 +00:00
|
|
|
corePropsBuilder->setUnicodeVersion(version);
|
2011-12-25 01:25:50 +00:00
|
|
|
bidiPropsBuilder->setUnicodeVersion(version);
|
2012-01-10 07:23:44 +00:00
|
|
|
casePropsBuilder->setUnicodeVersion(version);
|
2012-01-03 23:20:55 +00:00
|
|
|
namesPropsBuilder->setUnicodeVersion(version);
|
|
|
|
} else if(lineType==PreparsedUCD::ALG_NAMES_RANGE_LINE) {
|
|
|
|
UChar32 start, end;
|
|
|
|
if(ppucd.getRangeForAlgNames(start, end, errorCode)) {
|
|
|
|
const char *type=ppucd.nextField();
|
|
|
|
const char *prefix=ppucd.nextField(); // NULL if type==hangul
|
|
|
|
namesPropsBuilder->setAlgNamesRange(start, end, type, prefix, errorCode);
|
|
|
|
}
|
2011-12-16 06:51:58 +00:00
|
|
|
}
|
2011-12-17 05:03:26 +00:00
|
|
|
if(errorCode.isFailure()) {
|
|
|
|
fprintf(stderr,
|
|
|
|
"genprops: error parsing or setting values from ppucd.txt line %ld - %s\n",
|
|
|
|
(long)ppucd.getLineNumber(), errorCode.errorName());
|
|
|
|
return errorCode.reset();
|
|
|
|
}
|
2011-12-16 06:51:58 +00:00
|
|
|
}
|
|
|
|
|
2011-12-19 01:49:34 +00:00
|
|
|
corePropsBuilder->build(errorCode);
|
2011-12-25 01:25:50 +00:00
|
|
|
bidiPropsBuilder->build(errorCode);
|
2012-01-10 07:23:44 +00:00
|
|
|
casePropsBuilder->build(errorCode);
|
2012-01-03 23:20:55 +00:00
|
|
|
namesPropsBuilder->build(errorCode);
|
2011-12-18 00:37:18 +00:00
|
|
|
if(errorCode.isFailure()) {
|
|
|
|
fprintf(stderr, "genprops error: failure finalizing the data - %s\n",
|
|
|
|
errorCode.errorName());
|
|
|
|
return errorCode.reset();
|
2000-04-18 16:56:02 +00:00
|
|
|
}
|
|
|
|
|
2011-12-18 00:37:18 +00:00
|
|
|
// Write the files with the generated data.
|
|
|
|
CharString sourceCommon(icuSource, errorCode);
|
|
|
|
sourceCommon.appendPathPart("common", errorCode);
|
|
|
|
|
|
|
|
CharString sourceDataIn(icuSourceData, errorCode);
|
|
|
|
sourceDataIn.appendPathPart("in", errorCode);
|
|
|
|
|
|
|
|
UBool withCopyright=options[COPYRIGHT].doesOccur;
|
|
|
|
|
2011-12-19 01:49:34 +00:00
|
|
|
pnamesBuilder->writeCSourceFile(sourceCommon.data(), errorCode);
|
|
|
|
pnamesBuilder->writeBinaryData(sourceDataIn.data(), withCopyright, errorCode);
|
|
|
|
corePropsBuilder->writeCSourceFile(sourceCommon.data(), errorCode);
|
|
|
|
corePropsBuilder->writeBinaryData(sourceDataIn.data(), withCopyright, errorCode);
|
2011-12-25 01:25:50 +00:00
|
|
|
bidiPropsBuilder->writeCSourceFile(sourceCommon.data(), errorCode);
|
|
|
|
bidiPropsBuilder->writeBinaryData(sourceDataIn.data(), withCopyright, errorCode);
|
2012-01-10 07:23:44 +00:00
|
|
|
casePropsBuilder->writeCSourceFile(sourceCommon.data(), errorCode);
|
|
|
|
casePropsBuilder->writeBinaryData(sourceDataIn.data(), withCopyright, errorCode);
|
2012-01-03 23:20:55 +00:00
|
|
|
namesPropsBuilder->writeBinaryData(sourceDataIn.data(), withCopyright, errorCode);
|
2011-12-18 00:37:18 +00:00
|
|
|
|
2000-04-18 16:56:02 +00:00
|
|
|
return errorCode;
|
1999-12-10 01:44:19 +00:00
|
|
|
}
|
|
|
|
|
2000-02-29 18:42:28 +00:00
|
|
|
/*
|
|
|
|
* Hey, Emacs, please set the following:
|
|
|
|
*
|
|
|
|
* Local Variables:
|
|
|
|
* indent-tabs-mode: nil
|
|
|
|
* End:
|
|
|
|
*
|
2003-09-15 21:29:51 +00:00
|
|
|
*/
|