/* ********************************************************************** * Copyright (C) 1999, International Business Machines * Corporation and others. All Rights Reserved. ********************************************************************** * * * ucnv_bld.h: * Contains all internal and external data structure definitions * Created & Maitained by Bertrand A. Damiba * * * * ATTENTION: * --------- * Although the data structures in this file are open and stack allocatable * we reserve the right to hide them in further releases. * * Change history: * * 06/29/2000 helena Major rewrite of the callback APIs. */ #ifndef UCNV_BLD_H #define UCNV_BLD_H #include "unicode/utypes.h" #include "unicode/ucnv.h" #include "unicode/ucnv_err.h" /* ### move the following typedef and array into implementation files! */ typedef struct { int32_t ccsid; UChar mismapped; UChar replacement; } UAmbiguousConverter; static const UAmbiguousConverter UCNV_AMBIGUOUSCONVERTERS[UCNV_MAX_AMBIGUOUSCCSIDS] = { { 943, 0x00A5, 0x005C }, { 949, 0x20A9, 0x005C }, { 1361, 0x20A9, 0x005C }, { 942, 0x00A5, 0x005C }, { 1363, 0x20A9, 0x005C } }; U_CDECL_BEGIN /* We must declare the following as 'extern "C"' so that if ucnv itself is compiled under C++, the linkage of the funcptrs will work. */ union UConverterTable; typedef union UConverterTable UConverterTable; struct UConverterImpl; typedef struct UConverterImpl UConverterImpl; /* ### * Markus Scherer on 2000feb04: * I have change UConverter and UConverterSharedData; there may be more changes, * or we may decide to roll back the structure definitions to what they were * before, with the additional UConverterImpl field and the new semantics for * referenceCounter. * * Reasons for changes: Attempt at performance improvements, especially * a) decrease amount of internal, implicit padding by reordering the fields * b) save space by storing the internal name of the converter only with a * pointer instead of an array * * In addition to that, I added the UConverterImpl field for better * modularizing the code and making it more maintainable. It may actually * become slightly faster by doing this. * * I changed the UConverter.to|fromUnicodeStatus to be unsigned because * the defaultValues.toUnicodeStatus is unsigned, and it seemed to be a safer choice. * * Ultimately, I would prefer not to expose these definitions any more at all, * but this is suspect to discussions, proposals and design reviews. * * I would personally like to see more information hiding (with helper APIs), * useful state fields in UConverter that are reserved for the callbacks, * and directly included structures instead of pointers to allocated * memory, like for UConverterTable and its variant fields. * * Also, with the more C++-like converter implementation, * the conversionType does not need to be in UConverterSharedData any more: * it is in UConverterImpl and hardly used. */ typedef struct { uint32_t structSize; /* Size of this structure */ char name [UCNV_MAX_CONVERTER_NAME_LENGTH]; /* internal name of the converter- invariant chars */ int32_t codepage; /* codepage # (now IBM-$codepage) */ int8_t platform; /* platform of the converter (only IBM now) */ int8_t conversionType; /* conversion type */ int8_t minBytesPerChar; /* Minimum # bytes per char in this codepage */ int8_t maxBytesPerChar; /* Maximum # bytes per char in this codepage */ int8_t subCharLen; uint8_t subChar[UCNV_MAX_SUBCHAR_LEN]; uint8_t hasToUnicodeFallback; /* UBool needs to be changed to UBool to be consistent across platform */ uint8_t hasFromUnicodeFallback; uint8_t reserved[19]; /* to round out the structure */ } UConverterStaticData; /* * Defines the UConverterSharedData struct, * the immutable, shared part of UConverter. */ typedef struct { uint32_t structSize; /* Size of this structure */ uint32_t referenceCounter; /* used to count number of clients, 0xffffffff for static SharedData */ const void *dataMemory; /* from udata_openChoice() */ UConverterTable *table; /* Pointer to conversion data */ const UConverterStaticData *staticData; /* pointer to the static (non changing) data. */ UBool staticDataOwned; /* T if we own the staticData */ const UConverterImpl *impl; /* vtable-style struct of mostly function pointers */ /*initial values of some members of the mutable part of object */ uint32_t toUnicodeStatus; } UConverterSharedData; /* Defines a UConverter, the lightweight mutable part the user sees */ struct UConverter { uint32_t toUnicodeStatus; /* Used to internalize stream status information */ uint32_t fromUnicodeStatus; UChar fromUSurrogateLead; int32_t mode; UBool useFallback; int8_t subCharLen; /* length of the codepage specific character sequence */ int8_t invalidCharLength; int8_t invalidUCharLength; int8_t charErrorBufferLength; /* number of valid bytes in charErrorBuffer */ int8_t UCharErrorBufferLength; /* number of valid UChars in charErrorBuffer */ uint8_t subChar[UCNV_MAX_SUBCHAR_LEN]; /* codepage specific character sequence */ char invalidCharBuffer[UCNV_MAX_SUBCHAR_LEN]; uint8_t charErrorBuffer[UCNV_ERROR_BUFFER_LENGTH]; /* codepage output from Error functions */ UChar invalidUCharBuffer[3]; UChar UCharErrorBuffer[UCNV_ERROR_BUFFER_LENGTH]; /* unicode output from Error functions */ /* * Error function pointer called when conversion issues * occur during a ucnv_fromUnicode call */ void (*fromUCharErrorBehaviour) (void *context, UConverterFromUnicodeArgs *args, const UChar *codeUnits, int32_t length, UChar32 codePoint, UConverterCallbackReason reason, UErrorCode *); /* * Error function pointer called when conversion issues * occur during a T_UConverter_toUnicode call */ void (*fromCharErrorBehaviour) (void *context, UConverterToUnicodeArgs *args, const char *codeUnits, int32_t length, UConverterCallbackReason reason, UErrorCode *); void *fromUContext; void *toUContext; UConverterSharedData *sharedData; /* Pointer to the shared immutable part of the converter object */ /* * currently only used to point to a struct containing UConverter used by iso 2022; * could be used by clients writing their own call back function to pass context to them */ void *extraInfo; }; U_CDECL_END /* end of UConverter */ typedef struct { UConverter *currentConverter; uint8_t escSeq2022[10]; int8_t escSeq2022Length; } UConverterDataISO2022; typedef struct { UConverter *OptGrpConverter[0x20]; /* Converter per Opt. grp. */ uint8_t OptGroup; /* default Opt. grp. for this LMBCS session */ uint8_t localeConverterIndex; /* reasonable locale match for index */ } UConverterDataLMBCS; #define CONVERTER_FILE_EXTENSION ".cnv" #endif /* _UCNV_BLD */