2010-12-31 18:21:36 +00:00
|
|
|
/*
|
|
|
|
*******************************************************************************
|
2011-01-02 07:22:36 +00:00
|
|
|
* Copyright (C) 2010-2011, International Business Machines
|
2010-12-31 18:21:36 +00:00
|
|
|
* Corporation and others. All Rights Reserved.
|
|
|
|
*******************************************************************************
|
2011-01-05 21:05:47 +00:00
|
|
|
* file name: bytestriebuilder.h
|
2010-12-31 18:21:36 +00:00
|
|
|
* encoding: US-ASCII
|
|
|
|
* tab size: 8 (not used)
|
|
|
|
* indentation:4
|
|
|
|
*
|
|
|
|
* created on: 2010sep25
|
|
|
|
* created by: Markus W. Scherer
|
|
|
|
*/
|
|
|
|
|
2011-01-05 21:05:47 +00:00
|
|
|
#ifndef __BYTESTRIEBUILDER_H__
|
|
|
|
#define __BYTESTRIEBUILDER_H__
|
2010-12-31 18:21:36 +00:00
|
|
|
|
|
|
|
#include "unicode/utypes.h"
|
|
|
|
#include "unicode/stringpiece.h"
|
2011-01-05 21:05:47 +00:00
|
|
|
#include "bytestrie.h"
|
2010-12-31 18:21:36 +00:00
|
|
|
#include "charstr.h"
|
2011-01-05 21:05:47 +00:00
|
|
|
#include "stringtriebuilder.h"
|
2010-12-31 18:21:36 +00:00
|
|
|
|
|
|
|
U_NAMESPACE_BEGIN
|
|
|
|
|
2011-01-05 21:05:47 +00:00
|
|
|
class BytesTrieElement;
|
2010-12-31 18:21:36 +00:00
|
|
|
|
2011-01-05 21:05:47 +00:00
|
|
|
/**
|
|
|
|
* Builder class for BytesTrie.
|
|
|
|
*/
|
|
|
|
class U_TOOLUTIL_API BytesTrieBuilder : public StringTrieBuilder {
|
2010-12-31 18:21:36 +00:00
|
|
|
public:
|
2011-01-05 21:05:47 +00:00
|
|
|
BytesTrieBuilder()
|
2010-12-31 18:21:36 +00:00
|
|
|
: elements(NULL), elementsCapacity(0), elementsLength(0),
|
|
|
|
bytes(NULL), bytesCapacity(0), bytesLength(0) {}
|
2011-01-05 21:05:47 +00:00
|
|
|
virtual ~BytesTrieBuilder();
|
2010-12-31 18:21:36 +00:00
|
|
|
|
2011-01-05 21:05:47 +00:00
|
|
|
BytesTrieBuilder &add(const StringPiece &s, int32_t value, UErrorCode &errorCode);
|
2010-12-31 18:21:36 +00:00
|
|
|
|
2011-01-05 21:05:47 +00:00
|
|
|
StringPiece build(UStringTrieBuildOption buildOption, UErrorCode &errorCode);
|
2010-12-31 18:21:36 +00:00
|
|
|
|
2011-01-05 21:05:47 +00:00
|
|
|
BytesTrieBuilder &clear() {
|
2010-12-31 18:21:36 +00:00
|
|
|
strings.clear();
|
|
|
|
elementsLength=0;
|
|
|
|
bytesLength=0;
|
|
|
|
return *this;
|
|
|
|
}
|
|
|
|
|
|
|
|
private:
|
2011-01-02 07:22:36 +00:00
|
|
|
virtual int32_t getElementStringLength(int32_t i) const;
|
|
|
|
virtual UChar getElementUnit(int32_t i, int32_t byteIndex) const;
|
|
|
|
virtual int32_t getElementValue(int32_t i) const;
|
2010-12-31 18:21:36 +00:00
|
|
|
|
2011-01-06 05:04:51 +00:00
|
|
|
virtual int32_t getLimitOfLinearMatch(int32_t first, int32_t last, int32_t byteIndex) const;
|
2010-12-31 18:21:36 +00:00
|
|
|
|
2011-01-02 07:22:36 +00:00
|
|
|
virtual int32_t countElementUnits(int32_t start, int32_t limit, int32_t byteIndex) const;
|
|
|
|
virtual int32_t skipElementsBySomeUnits(int32_t i, int32_t byteIndex, int32_t count) const;
|
|
|
|
virtual int32_t indexOfElementWithNextUnit(int32_t i, int32_t byteIndex, UChar byte) const;
|
2010-12-31 18:21:36 +00:00
|
|
|
|
2011-01-02 07:22:36 +00:00
|
|
|
virtual UBool matchNodesCanHaveValues() const { return FALSE; }
|
2010-12-31 23:56:06 +00:00
|
|
|
|
2011-01-05 21:05:47 +00:00
|
|
|
virtual int32_t getMaxBranchLinearSubNodeLength() const { return BytesTrie::kMaxBranchLinearSubNodeLength; }
|
|
|
|
virtual int32_t getMinLinearMatch() const { return BytesTrie::kMinLinearMatch; }
|
|
|
|
virtual int32_t getMaxLinearMatchLength() const { return BytesTrie::kMaxLinearMatchLength; }
|
2010-12-31 18:21:36 +00:00
|
|
|
|
|
|
|
class BTLinearMatchNode : public LinearMatchNode {
|
|
|
|
public:
|
|
|
|
BTLinearMatchNode(const char *units, int32_t len, Node *nextNode);
|
|
|
|
virtual UBool operator==(const Node &other) const;
|
2011-01-05 21:05:47 +00:00
|
|
|
virtual void write(StringTrieBuilder &builder);
|
2010-12-31 18:21:36 +00:00
|
|
|
private:
|
|
|
|
const char *s;
|
|
|
|
};
|
|
|
|
|
2011-01-06 05:04:51 +00:00
|
|
|
virtual Node *createLinearMatchNode(int32_t i, int32_t byteIndex, int32_t length,
|
2011-01-02 07:22:36 +00:00
|
|
|
Node *nextNode) const;
|
2010-12-31 18:21:36 +00:00
|
|
|
|
2011-01-02 07:22:36 +00:00
|
|
|
UBool ensureCapacity(int32_t length);
|
|
|
|
virtual int32_t write(int32_t byte);
|
|
|
|
int32_t write(const char *b, int32_t length);
|
|
|
|
virtual int32_t writeElementUnits(int32_t i, int32_t byteIndex, int32_t length);
|
2011-01-06 05:04:51 +00:00
|
|
|
virtual int32_t writeValueAndFinal(int32_t i, UBool isFinal);
|
2011-01-02 07:22:36 +00:00
|
|
|
virtual int32_t writeValueAndType(UBool hasValue, int32_t value, int32_t node);
|
|
|
|
virtual int32_t writeDeltaTo(int32_t jumpTarget);
|
2010-12-31 18:21:36 +00:00
|
|
|
|
|
|
|
CharString strings;
|
2011-01-05 21:05:47 +00:00
|
|
|
BytesTrieElement *elements;
|
2010-12-31 18:21:36 +00:00
|
|
|
int32_t elementsCapacity;
|
|
|
|
int32_t elementsLength;
|
|
|
|
|
|
|
|
// Byte serialization of the trie.
|
|
|
|
// Grows from the back: bytesLength measures from the end of the buffer!
|
|
|
|
char *bytes;
|
|
|
|
int32_t bytesCapacity;
|
|
|
|
int32_t bytesLength;
|
|
|
|
};
|
|
|
|
|
|
|
|
U_NAMESPACE_END
|
|
|
|
|
2011-01-05 21:05:47 +00:00
|
|
|
#endif // __BYTESTRIEBUILDER_H__
|