/* ******************************************************************************* * * Copyright (C) 1999-2001, International Business Machines * Corporation and others. All Rights Reserved. * ******************************************************************************* * file name: gencnval.c * encoding: US-ASCII * tab size: 8 (not used) * indentation:4 * * created on: 1999nov05 * created by: Markus W. Scherer * * This program reads convrtrs.txt and writes a memory-mappable * converter name alias table to cnvalias.dat . * * This program currently writes version 2.1 of the data format. See * ucnv_io.c for more details on the format. Note that version 2.1 * is written in such a way that a 2.0 reader will be able to use it, * and a 2.1 reader will be able to read 2.0. */ #include #include #include #include "unicode/utypes.h" #include "unicode/putil.h" #include "unicode/ucnv.h" /* ucnv_compareNames() */ #include "cmemory.h" #include "cstring.h" #include "filestrm.h" #include "unewdata.h" #include "uoptions.h" /* TODO: Need to specify the maximum alias name length in a header (see ucnv_io.c::findalias()) */ #define STRING_STORE_SIZE 100000 #define MAX_ALIAS_COUNT 2000 #define TAG_STORE_SIZE 20000 #define MAX_TAG_COUNT 200 #define DATA_NAME "cnvalias" #define DATA_TYPE "dat" /* UDataInfo cf. udata.h */ static const UDataInfo dataInfo={ sizeof(UDataInfo), 0, U_IS_BIG_ENDIAN, U_CHARSET_FAMILY, sizeof(UChar), 0, {0x43, 0x76, 0x41, 0x6c}, /* dataFormat="CvAl" */ {2, 1, 0, 0}, /* formatVersion */ {1, 4, 2, 0} /* dataVersion */ }; typedef struct { char *store; uint32_t top; uint32_t max; } StringBlock; static char stringStore[STRING_STORE_SIZE]; static StringBlock stringBlock = { stringStore, 0, STRING_STORE_SIZE }; typedef struct { const char *alias; uint16_t converter; } Alias; static Alias aliases[MAX_ALIAS_COUNT]; static uint16_t aliasCount=0; typedef struct { const char *converter; uint16_t aliasCount; } Converter; static Converter converters[MAX_ALIAS_COUNT]; static uint16_t converterCount=0; static char tagStore[TAG_STORE_SIZE]; static StringBlock tagBlock = { tagStore, 0, TAG_STORE_SIZE }; typedef struct { const char *tag; const char *aliases[MAX_ALIAS_COUNT]; } Tag; static Tag tags[MAX_TAG_COUNT]; static uint16_t tagCount = 0; /* prototypes --------------------------------------------------------------- */ static void parseLine(const char *line); static uint16_t addAlias(const char *alias, uint16_t converter); static uint16_t addConverter(const char *converter); static char * allocString(StringBlock *block, uint32_t length); static int compareAliases(const void *alias1, const void *alias2); static uint16_t getTagNumber(const char *tag, uint16_t tagLen); static void addTaggedAlias(uint16_t tag, const char *alias, uint16_t converter); /* -------------------------------------------------------------------------- */ static UOption options[]={ UOPTION_HELP_H, UOPTION_HELP_QUESTION_MARK, UOPTION_COPYRIGHT, UOPTION_DESTDIR, UOPTION_SOURCEDIR }; extern int main(int argc, char* argv[]) { char line[512]; const char *path; FileStream *in; UNewDataMemory *out; char *s; UErrorCode errorCode=U_ZERO_ERROR; int i; uint16_t tagOffset, stringOffset; U_MAIN_INIT_ARGS(argc, argv); /* preset then read command line options */ options[3].value=options[4].value=u_getDataDirectory(); argc=u_parseArgs(argc, argv, sizeof(options)/sizeof(options[0]), options); /* error handling, printing usage message */ if(argc<0) { fprintf(stderr, "error in command line argument \"%s\"\n", argv[-argc]); } if(argc<0 || options[0].doesOccur || options[1].doesOccur) { fprintf(stderr, "usage: %s [-options] [convrtrs.txt]\n" "\tread convrtrs.txt and create " DATA_NAME "." DATA_TYPE "\n" "options:\n" "\t-h or -? or --help this usage text\n" "\t-c or --copyright include a copyright notice\n" "\t-d or --destdir destination directory, followed by the path\n" "\t-s or --sourcedir source directory, followed by the path\n", argv[0]); return argc<0 ? U_ILLEGAL_ARGUMENT_ERROR : U_ZERO_ERROR; } if(argc>=2) { path=argv[1]; } else { path=options[4].value; if(path!=NULL && *path!=0) { uprv_strcpy(line, path); path=line+uprv_strlen(line); if(*(path-1)!=U_FILE_SEP_CHAR) { *((char *)path)=U_FILE_SEP_CHAR; ++path; } uprv_strcpy((char *)path, "convrtrs.txt"); path=line; } else { path = "convrtrs.txt"; } } in=T_FileStream_open(path, "r"); if(in==NULL) { fprintf(stderr, "gencnval: unable to open input file convrtrs.txt\n"); exit(U_FILE_ACCESS_ERROR); } /* read the list of aliases */ while(T_FileStream_readLine(in, line, sizeof(line))!=NULL) { /* remove trailing newline characters */ s=line; while(*s!=0) { if(*s=='\r' || *s=='\n') { *s=0; break; } ++s; } parseLine(line); } T_FileStream_close(in); /* sort the aliases */ qsort(aliases, aliasCount, sizeof(Alias), compareAliases); /* create the output file */ out=udata_create(options[3].value, DATA_TYPE, DATA_NAME, &dataInfo, options[2].doesOccur ? U_COPYRIGHT_STRING : NULL, &errorCode); if(U_FAILURE(errorCode)) { fprintf(stderr, "gencnval: unable to open output file - error %s\n", u_errorName(errorCode)); exit(errorCode); } /* determine the length of tables for the data offset of the strings */ tagOffset = (uint16_t)(2 + 4 * aliasCount + 2 + 4 * converterCount); stringOffset = (uint16_t)(tagOffset + 2 + (2 * tagCount) * converterCount + tagBlock.top); /* write the table of aliases */ udata_write16(out, aliasCount); for(i=0; i= MAX_TAG_COUNT) { fprintf(stderr, "gencnval: too many tags\n"); exit(U_BUFFER_OVERFLOW_ERROR); } for (t = 0; t < tagCount; ++t) { if (uprv_strlen(tags[t].tag) == tagLen && !uprv_strnicmp(tags[t].tag, tag, tagLen)) { return t; } } /* we need to add this tag */ if (tagCount >= MAX_TAG_COUNT) { fprintf(stderr, "gencnval: too many tags\n"); exit(U_BUFFER_OVERFLOW_ERROR); } /* allocate a new entry in the tag table */ atag = allocString(&tagBlock, tagLen + 1); uprv_memcpy(atag, tag, tagLen); atag[tagLen] = 0; /* add the tag to the tag table */ tags[tagCount].tag = atag; /* Set the array of pointers to NULL */ uprv_memset((void *)&tags[tagCount].aliases, 0, sizeof(tags[tagCount].aliases)); return tagCount++; } static void addTaggedAlias(uint16_t tag, const char *alias, uint16_t converter) { tags[tag].aliases[converter] = alias; } static uint16_t addAlias(const char *alias, uint16_t converter) { if(aliasCount>=MAX_ALIAS_COUNT) { fprintf(stderr, "gencnval: too many aliases\n"); exit(U_BUFFER_OVERFLOW_ERROR); } /* TODO: Check for duplicates */ aliases[aliasCount].alias = alias; aliases[aliasCount].converter = converter; converters[converter].aliasCount++; return aliasCount++; } static uint16_t addConverter(const char *converter) { if(converterCount>=MAX_ALIAS_COUNT) { fprintf(stderr, "gencnval: too many converters\n"); exit(U_BUFFER_OVERFLOW_ERROR); } /* TODO: Check for duplicates */ converters[converterCount].converter = converter; converters[converterCount].aliasCount = 0; return converterCount++; } static char * allocString(StringBlock *block, uint32_t length) { uint32_t top=block->top+length; char *p; if(top > block->max) { fprintf(stderr, "gencnval: out of memory\n"); exit(U_MEMORY_ALLOCATION_ERROR); } p = block->store + block->top; block->top = top; return p; } static int compareAliases(const void *alias1, const void *alias2) { return ucnv_compareNames(((Alias*)alias1)->alias, ((Alias*)alias2)->alias); } /* * Hey, Emacs, please set the following: * * Local Variables: * indent-tabs-mode: nil * End: * */