463391f84e
X-SVN-Rev: 4242
400 lines
9.7 KiB
C
400 lines
9.7 KiB
C
/*
|
|
******************************************************************************
|
|
*
|
|
* Copyright (C) 1998-2001, International Business Machines
|
|
* Corporation and others. All Rights Reserved.
|
|
*
|
|
******************************************************************************
|
|
*
|
|
* File ustdio.c
|
|
*
|
|
* Modification History:
|
|
*
|
|
* Date Name Description
|
|
* 11/18/98 stephen Creation.
|
|
* 03/12/99 stephen Modified for new C API.
|
|
* 07/19/99 stephen Fixed read() and gets()
|
|
******************************************************************************
|
|
*/
|
|
|
|
#include "unicode/ustdio.h"
|
|
#include "unicode/putil.h"
|
|
#include "ufile.h"
|
|
#include "ufmt_cmn.h"
|
|
#include "unicode/ucnv.h"
|
|
#include "unicode/ustring.h"
|
|
|
|
#include <string.h>
|
|
|
|
static const UChar DELIMITERS [] = { 0x000A, 0x0000 };
|
|
|
|
#define DELIM_CR 0x000D
|
|
#define DELIM_LF 0x000A
|
|
|
|
#define IS_STRING_DELIMITER(s) (UBool)( (s) == DELIM_CR || \
|
|
(s) == DELIM_LF )
|
|
|
|
|
|
/* Input/output */
|
|
|
|
int32_t
|
|
u_fputs(const UChar *s,
|
|
UFILE *f)
|
|
{
|
|
int32_t count = u_file_write(s, u_strlen(s), f);
|
|
count += u_file_write(DELIMITERS, u_strlen(DELIMITERS), f);
|
|
return count;
|
|
}
|
|
|
|
int32_t
|
|
u_fputc(UChar uc,
|
|
UFILE *f)
|
|
{
|
|
return u_file_write(&uc, 1, f) == 1 ? uc : EOF;
|
|
}
|
|
|
|
int32_t
|
|
u_file_write( const UChar *chars,
|
|
int32_t count,
|
|
UFILE *f)
|
|
{
|
|
/* Set up conversion parameters */
|
|
UErrorCode status = U_ZERO_ERROR;
|
|
const UChar *mySource = chars;
|
|
const UChar *sourceAlias = chars;
|
|
const UChar *mySourceEnd = chars + count;
|
|
char *myTarget = f->fCharBuffer;
|
|
int32_t bufferSize = UFILE_CHARBUFFER_SIZE;
|
|
int32_t written = 0;
|
|
|
|
/* Perform the conversion in a loop */
|
|
do {
|
|
status = U_ZERO_ERROR;
|
|
sourceAlias = mySource;
|
|
if(f->fConverter != NULL) { /* We have a valid converter */
|
|
ucnv_fromUnicode(f->fConverter,
|
|
&myTarget,
|
|
f->fCharBuffer + bufferSize,
|
|
&mySource,
|
|
mySourceEnd,
|
|
NULL,
|
|
FALSE, /* TODO: This must be true when we are closing the file */
|
|
&status);
|
|
} else { /*weiv: do the invariant conversion */
|
|
u_UCharsToChars(mySource, myTarget, count);
|
|
myTarget += count;
|
|
}
|
|
|
|
/* write the converted bytes */
|
|
fwrite(f->fCharBuffer,
|
|
sizeof(char),
|
|
myTarget - f->fCharBuffer,
|
|
f->fFile);
|
|
|
|
written += (myTarget - f->fCharBuffer);
|
|
myTarget = f->fCharBuffer;
|
|
}
|
|
while(status == U_BUFFER_OVERFLOW_ERROR);
|
|
|
|
/* return # of chars written */
|
|
return written;
|
|
}
|
|
|
|
/* private function used for buffering input */
|
|
void
|
|
ufile_fill_uchar_buffer(UFILE *f)
|
|
{
|
|
UErrorCode status;
|
|
const char *mySource;
|
|
const char *mySourceEnd;
|
|
UChar *myTarget;
|
|
int32_t bufferSize;
|
|
int32_t maxCPBytes;
|
|
int32_t bytesRead;
|
|
int32_t availLength;
|
|
int32_t dataSize;
|
|
|
|
|
|
/* shift the buffer if it isn't empty */
|
|
dataSize = f->fUCLimit - f->fUCPos;
|
|
if(dataSize != 0) {
|
|
memmove(f->fUCBuffer,
|
|
f->fUCPos,
|
|
dataSize * sizeof(UChar));
|
|
}
|
|
|
|
|
|
/* record how much buffer space is available */
|
|
availLength = UFILE_UCHARBUFFER_SIZE - dataSize;
|
|
|
|
/* Determine the # of codepage bytes needed to fill our UChar buffer */
|
|
/* weiv: if converter is NULL, we use invariant converter with charwidth = 1)*/
|
|
maxCPBytes = availLength / (f->fConverter!=NULL?(2*ucnv_getMinCharSize(f->fConverter)):1);
|
|
|
|
/* Read in the data to convert */
|
|
bytesRead = fread(f->fCharBuffer,
|
|
sizeof(char),
|
|
ufmt_min(maxCPBytes, UFILE_CHARBUFFER_SIZE),
|
|
f->fFile);
|
|
|
|
/* Set up conversion parameters */
|
|
status = U_ZERO_ERROR;
|
|
mySource = f->fCharBuffer;
|
|
mySourceEnd = f->fCharBuffer + bytesRead;
|
|
myTarget = f->fUCBuffer + dataSize;
|
|
bufferSize = UFILE_UCHARBUFFER_SIZE;
|
|
|
|
if(f->fConverter != NULL) { /* We have a valid converter */
|
|
/* Perform the conversion */
|
|
ucnv_toUnicode(f->fConverter,
|
|
&myTarget,
|
|
f->fUCBuffer + bufferSize,
|
|
&mySource,
|
|
mySourceEnd,
|
|
NULL,
|
|
(UBool)(feof(f->fFile) != 0),
|
|
&status);
|
|
|
|
} else { /*weiv: do the invariant conversion */
|
|
u_charsToUChars(mySource, myTarget, bytesRead);
|
|
myTarget += bytesRead;
|
|
}
|
|
|
|
/* update the pointers into our array */
|
|
f->fUCPos = f->fUCBuffer;
|
|
f->fUCLimit = myTarget;
|
|
}
|
|
|
|
UChar*
|
|
u_fgets(UFILE *f,
|
|
int32_t n,
|
|
UChar *s)
|
|
{
|
|
int32_t dataSize;
|
|
int32_t read;
|
|
int32_t count;
|
|
UChar *alias;
|
|
|
|
|
|
/* fill the buffer */
|
|
ufile_fill_uchar_buffer(f);
|
|
|
|
/* subtract 1 from n to compensate for the terminator */
|
|
--n;
|
|
|
|
/* determine the amount of data in the buffer */
|
|
dataSize = f->fUCLimit - f->fUCPos;
|
|
|
|
/* if the buffer contains more data than requested, operate on the buffer */
|
|
if(dataSize > n) {
|
|
|
|
/* find the first occurrence of a delimiter character */
|
|
alias = f->fUCPos;
|
|
count = 0;
|
|
while( ! IS_STRING_DELIMITER(*alias) && count < n) {
|
|
++count;
|
|
alias++;
|
|
}
|
|
|
|
/* copy the characters into the target*/
|
|
memcpy(s, f->fUCPos, count * sizeof(UChar));
|
|
|
|
/* add the terminator */
|
|
s[count] = 0x0000;
|
|
|
|
/* update the current buffer position */
|
|
f->fUCPos += count;
|
|
|
|
/* refill the buffer */
|
|
ufile_fill_uchar_buffer(f);
|
|
|
|
/* skip over any remaining delimiters */
|
|
while(IS_STRING_DELIMITER(*(f->fUCPos)) && f->fUCPos < f->fUCLimit)
|
|
(f->fUCPos)++;
|
|
|
|
/* return s */
|
|
return s;
|
|
}
|
|
|
|
/* otherwise, iteratively fill the buffer and copy */
|
|
read = 0;
|
|
do {
|
|
|
|
/* determine the amount of data in the buffer */
|
|
dataSize = f->fUCLimit - f->fUCPos;
|
|
|
|
/* find the first occurrence of a delimiter character, if present */
|
|
alias = f->fUCPos;
|
|
count = 0;
|
|
while( ! IS_STRING_DELIMITER(*alias) && alias < f->fUCLimit && count < n) {
|
|
++count;
|
|
alias++;
|
|
}
|
|
|
|
/* copy the current data in the buffer */
|
|
memcpy(s + read, f->fUCPos, count * sizeof(UChar));
|
|
|
|
/* update number of items read */
|
|
read += count;
|
|
|
|
/* update the current buffer position */
|
|
f->fUCPos += count;
|
|
|
|
/* if we found a delimiter */
|
|
if(alias < f->fUCLimit) {
|
|
|
|
/* refill the buffer */
|
|
ufile_fill_uchar_buffer(f);
|
|
|
|
/* skip over any remaining delimiters */
|
|
while(IS_STRING_DELIMITER(*(f->fUCPos)) && f->fUCPos < f->fUCLimit)
|
|
(f->fUCPos)++;
|
|
|
|
/* break out */
|
|
break;
|
|
}
|
|
|
|
/* refill the buffer */
|
|
ufile_fill_uchar_buffer(f);
|
|
|
|
} while(dataSize != 0 && read < n);
|
|
|
|
/* if 0 characters were read, return 0 */
|
|
if(read == 0)
|
|
return 0;
|
|
|
|
/* add the terminator and return s */
|
|
s[read] = 0x0000;
|
|
return s;
|
|
}
|
|
|
|
UChar
|
|
u_fgetc(UFILE *f)
|
|
{
|
|
/* if we have an available character in the buffer, return it */
|
|
if(f->fUCPos < f->fUCLimit)
|
|
return *(f->fUCPos)++;
|
|
/* otherwise, fill the buffer and return the next character */
|
|
else {
|
|
ufile_fill_uchar_buffer(f);
|
|
if(f->fUCPos < f->fUCLimit)
|
|
return *(f->fUCPos)++;
|
|
else
|
|
return 0xFFFF;
|
|
}
|
|
}
|
|
|
|
/* u_unescapeAt() callback to return a UChar from a UFILE */
|
|
static UChar _charAt(int32_t offset, void *context) {
|
|
return ((UFILE*) context)->fUCPos[offset];
|
|
}
|
|
|
|
/* Read a UChar from a UFILE and process escape sequences */
|
|
UChar32
|
|
u_fgetcx(UFILE *f) {
|
|
int32_t length;
|
|
int32_t offset;
|
|
UChar32 c32;
|
|
UChar c16;
|
|
|
|
/* Fill the buffer if it is empty */
|
|
if (f->fUCPos >= f->fUCLimit) {
|
|
ufile_fill_uchar_buffer(f);
|
|
}
|
|
|
|
/* Get the next character in the buffer */
|
|
if (f->fUCPos < f->fUCLimit) {
|
|
c16 = *(f->fUCPos)++;
|
|
} else {
|
|
c16 = U_EOF;
|
|
}
|
|
|
|
/* If it isn't a backslash, return it */
|
|
if (c16 != 0x005C /*'\\'*/) {
|
|
return c16;
|
|
}
|
|
|
|
/* Determine the amount of data in the buffer */
|
|
length = f->fUCLimit - f->fUCPos;
|
|
|
|
/* The longest escape sequence is \Uhhhhhhhh; make sure
|
|
we have at least that many characters */
|
|
if (length < 10) {
|
|
/* fill the buffer */
|
|
ufile_fill_uchar_buffer(f);
|
|
length = f->fUCLimit - f->fUCPos;
|
|
}
|
|
|
|
/* Process the escape */
|
|
offset = 0;
|
|
c32 = u_unescapeAt(_charAt, &offset, length, (void*)f);
|
|
|
|
/* Update the current buffer position */
|
|
f->fUCPos += offset;
|
|
|
|
return c32;
|
|
}
|
|
|
|
UChar
|
|
u_fungetc(UChar c,
|
|
UFILE *f)
|
|
{
|
|
/* if we're at the beginning of the buffer, sorry! */
|
|
if(f->fUCPos == f->fUCBuffer)
|
|
return 0xFFFF;
|
|
/* otherwise, put the character back */
|
|
else {
|
|
*--(f->fUCPos) = c;
|
|
return c;
|
|
}
|
|
}
|
|
|
|
int32_t
|
|
u_file_read( UChar *chars,
|
|
int32_t count,
|
|
UFILE *f)
|
|
{
|
|
int32_t dataSize;
|
|
int32_t read;
|
|
|
|
/* fill the buffer */
|
|
ufile_fill_uchar_buffer(f);
|
|
|
|
/* determine the amount of data in the buffer */
|
|
dataSize = f->fUCLimit - f->fUCPos;
|
|
|
|
/* if the buffer contains the amount requested, just copy */
|
|
if(dataSize > count) {
|
|
memcpy(chars, f->fUCPos, count * sizeof(UChar));
|
|
|
|
/* update the current buffer position */
|
|
f->fUCPos += count;
|
|
|
|
/* return # of chars read */
|
|
return count;
|
|
}
|
|
|
|
/* otherwise, iteratively fill the buffer and copy */
|
|
read = 0;
|
|
do {
|
|
|
|
/* determine the amount of data in the buffer */
|
|
dataSize = f->fUCLimit - f->fUCPos;
|
|
|
|
/* copy the current data in the buffer */
|
|
memcpy(chars + read, f->fUCPos, dataSize * sizeof(UChar));
|
|
|
|
/* update number of items read */
|
|
read += dataSize;
|
|
|
|
/* update the current buffer position */
|
|
f->fUCPos += dataSize;
|
|
|
|
/* refill the buffer */
|
|
ufile_fill_uchar_buffer(f);
|
|
|
|
} while(dataSize != 0 && read < count);
|
|
|
|
return read;
|
|
}
|