/* ******************************************************************************* * * Copyright (C) 1999, International Business Machines * Corporation and others. All Rights Reserved. * ******************************************************************************* * file name: gencmn.c * encoding: US-ASCII * tab size: 8 (not used) * indentation:4 * * created on: 1999nov01 * created by: Markus W. Scherer * * This program reads a list of data files and combines them * into one common, memory-mappable file. */ #include #include #include "unicode/utypes.h" #include "unicode/putil.h" #include "cmemory.h" #include "cstring.h" #include "filestrm.h" #include "toolutil.h" #include "unewdata.h" #include "uoptions.h" #define STRING_STORE_SIZE 100000 #define MAX_FILE_COUNT 2000 #define COMMON_DATA_NAME U_ICUDATA_NAME #define DATA_TYPE "dat" /* UDataInfo cf. udata.h */ static const UDataInfo dataInfo={ sizeof(UDataInfo), 0, U_IS_BIG_ENDIAN, U_CHARSET_FAMILY, sizeof(UChar), 0, 0x43, 0x6d, 0x6e, 0x44, /* dataFormat="CmnD" */ 1, 0, 0, 0, /* formatVersion */ 3, 0, 0, 0 /* dataVersion */ }; static uint32_t maxSize; static char stringStore[STRING_STORE_SIZE]; static uint32_t stringTop=0, basenameTotal=0; typedef struct { char *pathname, *basename; uint32_t basenameLength, basenameOffset, fileSize, fileOffset; } File; static File files[MAX_FILE_COUNT]; static uint32_t fileCount=0; /* prototypes --------------------------------------------------------------- */ static void addFile(const char *filename, UBool sourceTOC); static char * allocString(uint32_t length); static int compareFiles(const void *file1, const void *file2); /* -------------------------------------------------------------------------- */ static UOption options[]={ /*0*/ UOPTION_HELP_H, /*1*/ UOPTION_HELP_QUESTION_MARK, /*2*/ UOPTION_VERBOSE, /*3*/ UOPTION_COPYRIGHT, /*4*/ UOPTION_DESTDIR, /*5*/ UOPTION_DEF( "comment", 'C', UOPT_REQUIRES_ARG), /*6*/ UOPTION_DEF( "name", 'n', UOPT_REQUIRES_ARG), /*7*/ UOPTION_DEF( "type", 't', UOPT_REQUIRES_ARG), /*8*/ UOPTION_DEF( "source", 'S', UOPT_NO_ARG), /*9*/ UOPTION_DEF( "entrypoint", 'e', UOPT_REQUIRES_ARG) }; char symPrefix[100]; extern int main(int argc, char* argv[]) { static uint8_t buffer[4096]; char line[512]; FileStream *in, *file; UNewDataMemory *out; char *s; UErrorCode errorCode=U_ZERO_ERROR; uint32_t i, fileOffset, basenameOffset, length; UBool sourceTOC; const char *entrypointName = NULL; /* preset then read command line options */ options[4].value=u_getDataDirectory(); options[6].value=COMMON_DATA_NAME; options[7].value=DATA_TYPE; argc=u_parseArgs(argc, argv, sizeof(options)/sizeof(options[0]), options); #ifndef U_HAVE_BIND_INTERNAL_REFERENCES /* if it is ICU data.. no prefix. */ if(!uprv_strcmp(options[6].value, COMMON_DATA_NAME)) { symPrefix[0] = 0; } else { uprv_strcpy(symPrefix, options[6].value); uprv_strcat(symPrefix, "_"); } #else symPrefix[0] = 0; #endif /* error handling, printing usage message */ if(argc<0) { fprintf(stderr, "error in command line argument \"%s\"\n", argv[-argc]); } else if(argc<2) { argc=-1; } if(argc<0 || options[0].doesOccur || options[1].doesOccur) { fprintf(stderr, "usage: %s [-options] maxsize [list-filename]\n" "\tread the list file (default: stdin) and \n" "\tcreate a common data file from all the files listed but each not larger than maxsize\n" "\toptions:\n" "\t\t-h or -? or --help this usage text\n" "\t\t-v or --verbose verbose output\n" "\t\t-c or --copyright include the ICU copyright notice\n" "\t\t-C or --comment include a comment string\n" "\t\t-d or --destdir destination directory, followed by the path\n" "\t\t-n or --name name of the destination file, defaults to " COMMON_DATA_NAME "\n" "\t\t-t or --type type of the destination file, defaults to " DATA_TYPE "\n" "\t\t-S or --source write a .c source file with the table of contents\n", "\t\t-e or --entrypoint override the c entrypoint name (default: _ )", argv[0]); return argc<0 ? U_ILLEGAL_ARGUMENT_ERROR : U_ZERO_ERROR; } sourceTOC=options[8].doesOccur; maxSize=uprv_strtoul(argv[1], NULL, 0); if(maxSize==0 && !sourceTOC) { fprintf(stderr, "gencmn: maxSize %s not valid\n", argv[1]); exit(U_ILLEGAL_ARGUMENT_ERROR); } if(argc==2) { in=T_FileStream_stdin(); } else { in=T_FileStream_open(argv[2], "r"); if(in==NULL) { fprintf(stderr, "gencmn: unable to open input file %s\n", argv[2]); exit(U_FILE_ACCESS_ERROR); } } if(sourceTOC) { printf("Generating %s_%s.c Table of Contents source file\n", options[6].value, options[7].value); } else { printf("Generating %s.%s common data file with Table of Contents\n", options[6].value, options[7].value); } /* read the list of files and get their lengths */ while(T_FileStream_readLine(in, line, sizeof(line))!=NULL) { /* remove trailing newline characters */ s=line; while(*s!=0) { if(*s=='\r' || *s=='\n') { *s=0; break; } ++s; } addFile(getLongPathname(line), sourceTOC); } if(in!=T_FileStream_stdin()) { T_FileStream_close(in); } if(fileCount==0) { printf("gencmn: no files listed in %s\n", argc==2 ? "" : argv[2]); return 0; } /* sort the files by basename */ qsort(files, fileCount, sizeof(File), compareFiles); if(!sourceTOC) { /* determine the offsets of all basenames and files in this common one */ basenameOffset=4+8*fileCount; fileOffset=basenameOffset+(basenameTotal+15)&~0xf; for(i=0; ifilename && *(s-1)!=U_FILE_SEP_CHAR) { *s++=U_FILE_SEP_CHAR; } uprv_strcpy(s, options[6].value); if(*(options[7].value)!=0) { s+=uprv_strlen(s); *s++='_'; uprv_strcpy(s, options[7].value); } s+=uprv_strlen(s); uprv_strcpy(s, ".c"); /* open the output file */ out=T_FileStream_open(filename, "w"); if(out==NULL) { fprintf(stderr, "gencmn: unable to open .c output file %s\n", filename); exit(U_FILE_ACCESS_ERROR); } /* write the source file */ sprintf(buffer, "/*\n" " * ICU common data table of contents for %s.%s ,\n" " * Automatically generated by icu/source/tools/gencmn/gencmn .\n" " */\n\n" "#include \"unicode/utypes.h\"\n" "#include \"unicode/udata.h\"\n" "\n" "/* external symbol declarations for data */\n", options[6].value, options[7].value); T_FileStream_writeLine(out, buffer); sprintf(buffer, "extern const char\n %s%s[]", symPrefix, files[0].pathname); T_FileStream_writeLine(out, buffer); for(i=1; imaxSize) { return; } files[fileCount].fileSize=length; } else { char *t; /* get and store the basename */ filename=findBasename(filename); length=uprv_strlen(filename)+1; s=allocString(length); uprv_memcpy(s, filename, length); files[fileCount].basename=s; /* turn the basename into an entry point name and store in the pathname field */ t=files[fileCount].pathname=allocString(length); while(--length>0) { if(*s=='.' || *s=='-') { *t='_'; } else { *t=*s; } ++s; ++t; } *t=0; } ++fileCount; } static char * allocString(uint32_t length) { uint32_t top=stringTop+length; char *p; if(top>STRING_STORE_SIZE) { fprintf(stderr, "gencmn: out of memory\n"); exit(U_MEMORY_ALLOCATION_ERROR); } p=stringStore+stringTop; stringTop=top; return p; } static int compareFiles(const void *file1, const void *file2) { /* sort by basename */ return uprv_strcmp(((File *)file1)->basename, ((File *)file2)->basename); } /* * Hey, Emacs, please set the following: * * Local Variables: * indent-tabs-mode: nil * End: * */