2002-02-25 18:44:07 +00:00
|
|
|
/*
|
|
|
|
*******************************************************************************
|
|
|
|
*
|
2008-08-04 21:56:02 +00:00
|
|
|
* Copyright (C) 2002-2008, International Business Machines
|
2002-02-25 18:44:07 +00:00
|
|
|
* Corporation and others. All Rights Reserved.
|
|
|
|
*
|
|
|
|
*******************************************************************************
|
|
|
|
* file name: propsvec.h
|
|
|
|
* encoding: US-ASCII
|
|
|
|
* tab size: 8 (not used)
|
|
|
|
* indentation:4
|
|
|
|
*
|
|
|
|
* created on: 2002feb22
|
|
|
|
* created by: Markus W. Scherer
|
|
|
|
*
|
|
|
|
* Store additional Unicode character properties in bit set vectors.
|
|
|
|
*/
|
|
|
|
|
|
|
|
#ifndef __UPROPSVEC_H__
|
|
|
|
#define __UPROPSVEC_H__
|
|
|
|
|
|
|
|
#include "unicode/utypes.h"
|
|
|
|
#include "utrie.h"
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Unicode Properties Vectors associated with code point ranges.
|
|
|
|
* Stored in an array of uint32_t.
|
|
|
|
*
|
|
|
|
* The array starts with a header, then rows of integers store
|
|
|
|
* the range limits and the properties vectors.
|
|
|
|
*
|
|
|
|
* In each row, row[0] contains the start code point and
|
|
|
|
* row[1] contains the limit code point,
|
|
|
|
* which is the start of the next range.
|
|
|
|
*
|
|
|
|
* Initially, there is only one range [0..0x110000[ with values 0.
|
|
|
|
*
|
|
|
|
* It would be possible to store only one range boundary per row,
|
|
|
|
* but self-contained rows allow to later sort them by contents.
|
|
|
|
*/
|
|
|
|
enum {
|
2004-08-30 22:11:48 +00:00
|
|
|
/* stores number of columns, plus two for start & limit values */
|
2002-02-25 18:44:07 +00:00
|
|
|
UPVEC_COLUMNS,
|
|
|
|
UPVEC_MAXROWS,
|
|
|
|
UPVEC_ROWS,
|
2004-08-30 22:11:48 +00:00
|
|
|
/* search optimization: remember last row seen */
|
|
|
|
UPVEC_PREV_ROW,
|
2002-02-25 18:44:07 +00:00
|
|
|
UPVEC_HEADER_LENGTH
|
|
|
|
};
|
|
|
|
|
2004-08-30 22:11:48 +00:00
|
|
|
U_CAPI uint32_t * U_EXPORT2
|
2002-02-25 18:44:07 +00:00
|
|
|
upvec_open(int32_t columns, int32_t maxRows);
|
|
|
|
|
2004-08-30 22:11:48 +00:00
|
|
|
U_CAPI void U_EXPORT2
|
2002-02-25 18:44:07 +00:00
|
|
|
upvec_close(uint32_t *pv);
|
|
|
|
|
2004-08-30 22:11:48 +00:00
|
|
|
U_CAPI UBool U_EXPORT2
|
2002-02-25 18:44:07 +00:00
|
|
|
upvec_setValue(uint32_t *pv,
|
2004-08-30 22:11:48 +00:00
|
|
|
UChar32 start, UChar32 limit,
|
2002-02-25 18:44:07 +00:00
|
|
|
int32_t column,
|
|
|
|
uint32_t value, uint32_t mask,
|
|
|
|
UErrorCode *pErrorCode);
|
|
|
|
|
2004-08-30 22:11:48 +00:00
|
|
|
U_CAPI uint32_t U_EXPORT2
|
|
|
|
upvec_getValue(uint32_t *pv, UChar32 c, int32_t column);
|
|
|
|
|
|
|
|
/*
|
|
|
|
* pRangeStart and pRangeLimit can be NULL.
|
|
|
|
* @return NULL if rowIndex out of range and for illegal arguments
|
|
|
|
*/
|
|
|
|
U_CAPI uint32_t * U_EXPORT2
|
2002-02-25 18:44:07 +00:00
|
|
|
upvec_getRow(uint32_t *pv, int32_t rowIndex,
|
2004-08-30 22:11:48 +00:00
|
|
|
UChar32 *pRangeStart, UChar32 *pRangeLimit);
|
2002-02-25 18:44:07 +00:00
|
|
|
|
2005-01-02 00:21:25 +00:00
|
|
|
/*
|
|
|
|
* Compact the vectors:
|
|
|
|
* - modify the memory
|
|
|
|
* - keep only unique vectors
|
|
|
|
* - store them contiguously from the beginning of the memory
|
|
|
|
* - for each (non-unique) row, call the handler function
|
|
|
|
*
|
|
|
|
* The handler's rowIndex is the uint32_t index of the row in the compacted
|
|
|
|
* memory block.
|
|
|
|
* (Therefore, it starts at 0 increases in increments of the columns value.)
|
|
|
|
*/
|
|
|
|
|
|
|
|
typedef void U_CALLCONV
|
|
|
|
UPVecCompactHandler(void *context,
|
|
|
|
UChar32 start, UChar32 limit,
|
|
|
|
int32_t rowIndex, uint32_t *row, int32_t columns,
|
|
|
|
UErrorCode *pErrorCode);
|
|
|
|
|
2004-08-30 22:11:48 +00:00
|
|
|
U_CAPI int32_t U_EXPORT2
|
2005-01-02 00:21:25 +00:00
|
|
|
upvec_compact(uint32_t *pv, UPVecCompactHandler *handler, void *context, UErrorCode *pErrorCode);
|
|
|
|
|
|
|
|
/* context=UNewTrie, stores the rowIndex values into the trie */
|
|
|
|
U_CAPI void U_CALLCONV
|
|
|
|
upvec_compactToTrieHandler(void *context,
|
|
|
|
UChar32 start, UChar32 limit,
|
|
|
|
int32_t rowIndex, uint32_t *row, int32_t columns,
|
|
|
|
UErrorCode *pErrorCode);
|
2002-02-25 18:44:07 +00:00
|
|
|
|
|
|
|
#endif
|