/* ******************************************************************************* * * Copyright (C) 1999-2001, International Business Machines * Corporation and others. All Rights Reserved. * ******************************************************************************* * file name: gencmn.c * encoding: US-ASCII * tab size: 8 (not used) * indentation:4 * * created on: 1999nov01 * created by: Markus W. Scherer * * This program reads a list of data files and combines them * into one common, memory-mappable file. */ #include #include #include "unicode/utypes.h" #include "unicode/putil.h" #include "cmemory.h" #include "cstring.h" #include "filestrm.h" #include "toolutil.h" #include "unewdata.h" #include "uoptions.h" #define STRING_STORE_SIZE 100000 #define MAX_FILE_COUNT 2000 #define COMMON_DATA_NAME U_ICUDATA_NAME #define DATA_TYPE "dat" /* UDataInfo cf. udata.h */ static const UDataInfo dataInfo={ sizeof(UDataInfo), 0, U_IS_BIG_ENDIAN, U_CHARSET_FAMILY, sizeof(UChar), 0, {0x43, 0x6d, 0x6e, 0x44}, /* dataFormat="CmnD" */ {1, 0, 0, 0}, /* formatVersion */ {3, 0, 0, 0} /* dataVersion */ }; static uint32_t maxSize; static char stringStore[STRING_STORE_SIZE]; static uint32_t stringTop=0, basenameTotal=0; typedef struct { char *pathname, *basename; uint32_t basenameLength, basenameOffset, fileSize, fileOffset; } File; static File files[MAX_FILE_COUNT]; static uint32_t fileCount=0; /* prototypes --------------------------------------------------------------- */ static void addFile(const char *filename, UBool sourceTOC, UBool verbose); static char * allocString(uint32_t length); static int compareFiles(const void *file1, const void *file2); /* -------------------------------------------------------------------------- */ static UOption options[]={ /*0*/ UOPTION_HELP_H, /*1*/ UOPTION_HELP_QUESTION_MARK, /*2*/ UOPTION_VERBOSE, /*3*/ UOPTION_COPYRIGHT, /*4*/ UOPTION_DESTDIR, /*5*/ UOPTION_DEF( "comment", 'C', UOPT_REQUIRES_ARG), /*6*/ UOPTION_DEF( "name", 'n', UOPT_REQUIRES_ARG), /*7*/ UOPTION_DEF( "type", 't', UOPT_REQUIRES_ARG), /*8*/ UOPTION_DEF( "source", 'S', UOPT_NO_ARG), /*9*/ UOPTION_DEF( "entrypoint", 'e', UOPT_REQUIRES_ARG) }; char symPrefix[100]; extern int main(int argc, char* argv[]) { static char buffer[4096]; char line[512]; FileStream *in, *file; char *s; UErrorCode errorCode=U_ZERO_ERROR; uint32_t i, fileOffset, basenameOffset, length, nread; UBool sourceTOC, verbose; const char *entrypointName = NULL; /* preset then read command line options */ options[4].value=u_getDataDirectory(); options[6].value=COMMON_DATA_NAME; options[7].value=DATA_TYPE; argc=u_parseArgs(argc, argv, sizeof(options)/sizeof(options[0]), options); #ifndef U_HAVE_BIND_INTERNAL_REFERENCES /* if it is ICU data.. no prefix. */ if(!uprv_strcmp(options[6].value, COMMON_DATA_NAME)) { symPrefix[0] = 0; } else { uprv_strcpy(symPrefix, options[6].value); uprv_strcat(symPrefix, "_"); } #else symPrefix[0] = 0; #endif /* error handling, printing usage message */ if(argc<0) { fprintf(stderr, "error in command line argument \"%s\"\n", argv[-argc]); } else if(argc<2) { argc=-1; } if(argc<0 || options[0].doesOccur || options[1].doesOccur) { /* * Broken into chucks because the C89 standard says the minimum * required supported string length is 509 bytes. */ fprintf(stderr, "usage: %s [-options] maxsize [list-filename]\n" "\n" "Read the list file (default: stdin) and \n" "create a common data file from specified files; omit any larger than maxsize\n" "\n", argv[0]); fprintf(stderr, " option parameter description\n" " ---------------------------------------------------------------------------\n" " -h or -? or --help this usage text\n" " -v or --verbose verbose output\n" " -c or --copyright include the ICU copyright notice\n" " -C or --comment \"text\" include a comment string\n" " -d or --destdir dir destination directory\n"); fprintf(stderr, " -n or --name file-name output file name, without .type extension\n" " defaults to " COMMON_DATA_NAME "\n" " -t or --type file-type type of the destination file\n" " defaults to \"" DATA_TYPE "\"\n" " -S or --source toc-file write a .c source file with the table of contents\n" " -e or --entrypoint name override the c entrypoint name\n" " defaults to \"_\" "); return argc<0 ? U_ILLEGAL_ARGUMENT_ERROR : U_ZERO_ERROR; } sourceTOC=options[8].doesOccur; verbose = options[2].doesOccur; maxSize=(uint32_t)uprv_strtoul(argv[1], NULL, 0); if(argc==2) { in=T_FileStream_stdin(); } else { in=T_FileStream_open(argv[2], "r"); if(in==NULL) { fprintf(stderr, "gencmn: unable to open input file %s\n", argv[2]); exit(U_FILE_ACCESS_ERROR); } } if (verbose) { if(sourceTOC) { printf("generating %s_%s.c (table of contents source file)\n", options[6].value, options[7].value); } else { printf("generating %s.%s (common data file with table of contents)\n", options[6].value, options[7].value); } } /* read the list of files and get their lengths */ while(T_FileStream_readLine(in, line, sizeof(line))!=NULL) { /* remove trailing newline characters */ s=line; while(*s!=0) { if(*s=='\r' || *s=='\n') { *s=0; break; } ++s; } /* check for comment */ if (*line == '#') { continue; } /* add the file */ addFile(getLongPathname(line), sourceTOC, verbose); } if(in!=T_FileStream_stdin()) { T_FileStream_close(in); } if(fileCount==0) { fprintf(stderr, "gencmn: no files listed in %s\n", argc==2 ? "" : argv[2]); return 0; } /* sort the files by basename */ qsort(files, fileCount, sizeof(File), compareFiles); if(!sourceTOC) { UNewDataMemory *out; /* determine the offsets of all basenames and files in this common one */ basenameOffset=4+8*fileCount; fileOffset=(basenameOffset+(basenameTotal+15))&~0xf; for(i=0; ifilename && *(s-1)!=U_FILE_SEP_CHAR) { *s++=U_FILE_SEP_CHAR; } uprv_strcpy(s, options[6].value); if(*(options[7].value)!=0) { s+=uprv_strlen(s); *s++='_'; uprv_strcpy(s, options[7].value); } s+=uprv_strlen(s); uprv_strcpy(s, ".c"); /* open the output file */ out=T_FileStream_open(filename, "w"); if(out==NULL) { fprintf(stderr, "gencmn: unable to open .c output file %s\n", filename); exit(U_FILE_ACCESS_ERROR); } /* write the source file */ sprintf(buffer, "/*\n" " * ICU common data table of contents for %s.%s ,\n" " * Automatically generated by icu/source/tools/gencmn/gencmn .\n" " */\n\n" "#include \"unicode/utypes.h\"\n" "#include \"unicode/udata.h\"\n" "\n" "/* external symbol declarations for data */\n", options[6].value, options[7].value); T_FileStream_writeLine(out, buffer); sprintf(buffer, "extern const char\n %s%s[]", symPrefix, files[0].pathname); T_FileStream_writeLine(out, buffer); for(i=1; imaxSize) { if (verbose) { printf("%s ignored (size %ld > %ld)\n", length, maxSize); } return; } files[fileCount].fileSize=length; } else { char *t; /* get and store the basename */ filename=findBasename(filename); length=uprv_strlen(filename)+1; s=allocString(length); uprv_memcpy(s, filename, length); files[fileCount].basename=s; /* turn the basename into an entry point name and store in the pathname field */ t=files[fileCount].pathname=allocString(length); while(--length>0) { if(*s=='.' || *s=='-') { *t='_'; } else { *t=*s; } ++s; ++t; } *t=0; } ++fileCount; } static char * allocString(uint32_t length) { uint32_t top=stringTop+length; char *p; if(top>STRING_STORE_SIZE) { fprintf(stderr, "gencmn: out of memory\n"); exit(U_MEMORY_ALLOCATION_ERROR); } p=stringStore+stringTop; stringTop=top; return p; } static int compareFiles(const void *file1, const void *file2) { /* sort by basename */ return uprv_strcmp(((File *)file1)->basename, ((File *)file2)->basename); } /* * Hey, Emacs, please set the following: * * Local Variables: * indent-tabs-mode: nil * End: * */