scuffed-code/icu4c/source/tools/genprops/misc/ucdstrip.c

/*
*******************************************************************************
*
*   Copyright (C) 2003, International Business Machines
*   Corporation and others.  All Rights Reserved.
*
*******************************************************************************
*   file name:  ucdstrip.c
*   encoding:   US-ASCII
*   tab size:   8 (not used)
*   indentation:4
*
*   created on: 2003feb20
*   created by: Markus W. Scherer
*
*   Simple tool for Unicode Character Database files with semicolon-delimited fields.
*   Removes comments behind data lines but not in others.
*
*   To compile, just call a C compiler/linker with this source file.
*   On Windows: cl ucdstrip.c
*/

#include <stdio.h>
#include <string.h>
#include <stdlib.h>

/*
 * Locate the end of the data portion of a line.
 *
 * l is a NUL-terminated line. If it contains a '#', the result points at the
 * first of the spaces/tabs that immediately precede that '#', or at the '#'
 * itself when no such whitespace precedes it. If there is no '#', the result
 * points at the terminating NUL.
 *
 * The returned pointer refers into l, so the caller can truncate the line by
 * storing a 0 there.
 */
static char *
endOfData(const char *l) {
    char *hash=strchr(l, '#');

    if(hash==NULL) {
        /* no comment on this line: the data runs up to the terminator */
        return strchr(l, 0);
    }

    /* step back over blanks and tabs in front of the comment, never before l */
    while(hash!=l && (hash[-1]==' ' || hash[-1]=='\t')) {
        --hash;
    }
    return hash;
}

/*
 * Filter standard input to standard output, one line at a time.
 *
 * A line on which strtol() can parse a non-negative base-16 number at the
 * start is treated as a data line (code point or range followed by fields):
 * it is cut off at the position returned by endOfData(), which drops a
 * trailing '#' comment together with the spaces/tabs in front of it.
 * Every other line is written out unchanged.
 *
 * Lines are read with fgets() instead of gets(): gets() cannot limit how much
 * it writes into the buffer and was removed from the language in C11.
 * The newline that fgets() stores is stripped again because puts() appends one.
 * An input line that does not fit into the buffer is reported on stderr and
 * ends the program with EXIT_FAILURE instead of overflowing the buffer.
 *
 * argc and argv are not used.
 * Returns 0 on success, EXIT_FAILURE for an overlong line or a read error.
 */
extern int
main(int argc, const char *argv[]) {
    static char line[2000];
    char *end;
    size_t length;

    (void)argc;
    (void)argv;

    while(fgets(line, (int)sizeof(line), stdin)!=NULL) {
        length=strlen(line);
        if(length>0 && line[length-1]=='\n') {
            /* complete line: remove the newline, puts() below adds it back */
            line[length-1]=0;
        } else if(length==sizeof(line)-1) {
            /*
             * The buffer is full and holds no newline. This is still a whole
             * line only if the very next character ends it.
             */
            int next=getc(stdin);
            if(next!=EOF && next!='\n') {
                fprintf(stderr, "ucdstrip: input line longer than %d characters\n",
                        (int)(sizeof(line)-1));
                return EXIT_FAILURE;
            }
        }
        /* otherwise: last line of the input without a trailing newline */

        /* end!=line means that strtol() consumed at least one character */
        if(strtol(line, &end, 16)>=0 && end!=line) {
            /* code point or range followed by semicolon and data, remove comment */
            *endOfData(line)=0;
        }
        puts(line);
    }

    if(ferror(stdin)) {
        fprintf(stderr, "ucdstrip: error reading standard input\n");
        return EXIT_FAILURE;
    }

    return 0;
}
ICU-2427 add UCD tools X-SVN-Rev: 11138 2003-02-21 16:17:42 +00:00
			`/*`
			`*******************************************************************************`
			`*`
			`* Copyright (C) 2003, International Business Machines`
			`* Corporation and others. All Rights Reserved.`
			`*`
			`*******************************************************************************`
			`* file name: ucdstrip.c`
			`* encoding: US-ASCII`
			`* tab size: 8 (not used)`
			`* indentation:4`
			`*`
			`* created on: 2003feb20`
			`* created by: Markus W. Scherer`
			`*`
			`* Simple tool for Unicode Character Database files with semicolon-delimited fields.`
			`* Removes comments behind data lines but not in others.`
			`*`
			`* To compile, just call a C compiler/linker with this source file.`
			`* On Windows: cl ucdstrip.c`
			`*/`

			`#include <stdio.h>`
			`#include <string.h>`
			`#include <stdlib.h>`

			`/* return the first character position after the end of the data */`
			`static char *`
			`endOfData(const char *l) {`
			`char *end;`
			`char c;`

			`end=strchr(l, '#');`
			`if(end!=NULL) {`
			`/* ignore whitespace before the comment */`
			`while(l!=end && ((c=*(end-1))==' ' || c=='\t')) {`
			`--end;`
			`}`
			`} else {`
			`end=strchr(l, 0);`
			`}`
			`return end;`
			`}`

			`extern int`
			`main(int argc, const char *argv[]) {`
			`static char line[2000];`
			`char *end;`

			`while(gets(line)!=NULL) {`
			`if(strtol(line, &end, 16)>=0 && end!=line) {`
			`/* code point or range followed by semicolon and data, remove comment */`
			`*endOfData(line)=0;`
			`}`
			`puts(line);`
			`}`

			`return 0;`
			`}`