ICU 57.1
bytestriebuilder.h
Go to the documentation of this file.
1/*
2*******************************************************************************
3* Copyright (C) 2010-2016, International Business Machines
4* Corporation and others. All Rights Reserved.
5*******************************************************************************
6* file name: bytestriebuilder.h
7* encoding: US-ASCII
8* tab size: 8 (not used)
9* indentation:4
10*
11* created on: 2010sep25
12* created by: Markus W. Scherer
13*/
14
20#ifndef __BYTESTRIEBUILDER_H__
21#define __BYTESTRIEBUILDER_H__
22
23#include "unicode/utypes.h"
24#include "unicode/bytestrie.h"
25#include "unicode/stringpiece.h"
27
29
30class BytesTrieElement;
31class CharString;
32
40public:
47
53
// Adds a (byte sequence, value) pair to the builder.
//   s         - the byte sequence, passed as a StringPiece.
//   value     - the int32_t value associated with that byte sequence.
//   errorCode - ICU error code passed by reference (used instead of exceptions).
// Returns a BytesTrieBuilder reference -- presumably *this, to allow chained
// calls (TODO confirm against the implementation).
68 BytesTrieBuilder &add(const StringPiece &s, int32_t value, UErrorCode &errorCode);
69
89
113
121
122private:
// Copy construction and copy assignment are declared in the private section,
// so code outside the class cannot copy or assign a builder.
123 BytesTrieBuilder(const BytesTrieBuilder &other); // no copy constructor
124 BytesTrieBuilder &operator=(const BytesTrieBuilder &other); // no assignment operator
125
// Private build helper. It takes the same (buildOption, errorCode) arguments as
// the public build() and buildStringPiece() -- presumably the shared worker that
// produces the serialized `bytes` for both (TODO confirm in the implementation).
126 void buildBytes(UStringTrieBuildOption buildOption, UErrorCode &errorCode);
127
// Per-element accessors. Their signatures match the pure-virtual hooks
// getElementStringLength / getElementUnit / getElementValue of the string trie
// builder base class, with the base's "unitIndex" named "byteIndex" here.
// `i` is an element index -- presumably into `elements` (TODO confirm).
128 virtual int32_t getElementStringLength(int32_t i) const;
// Returns UChar because the base-class hook is declared that way, even though
// this builder indexes by byte.
129 virtual UChar getElementUnit(int32_t i, int32_t byteIndex) const;
130 virtual int32_t getElementValue(int32_t i) const;
131
// Element-range queries. Their signatures match the base class's pure-virtual
// hooks of the same names, with "unitIndex" renamed to "byteIndex".
// Exact semantics are defined by the implementation file, which is not visible
// here; the notes below are inferred from names only and need confirming.

// presumably: limit index of the common prefix shared by elements first..last
132 virtual int32_t getLimitOfLinearMatch(int32_t first, int32_t last, int32_t byteIndex) const;
133
// presumably: number of distinct bytes at byteIndex among elements [start, limit)
134 virtual int32_t countElementUnits(int32_t start, int32_t limit, int32_t byteIndex) const;
// presumably: advances from element i past `count` distinct bytes at byteIndex
135 virtual int32_t skipElementsBySomeUnits(int32_t i, int32_t byteIndex, int32_t count) const;
// Takes the byte as a UChar, as the base-class hook does for its `unit` argument.
136 virtual int32_t indexOfElementWithNextUnit(int32_t i, int32_t byteIndex, UChar byte) const;
137
// Inline constant hooks. Their signatures match the base class's pure-virtual
// hooks of the same names; each returns a fixed value.

// Always FALSE for this builder.
138 virtual UBool matchNodesCanHaveValues() const { return FALSE; }
139
// The three limits below are forwarded unchanged from the BytesTrie reader
// class constants of the same names.
140 virtual int32_t getMaxBranchLinearSubNodeLength() const { return BytesTrie::kMaxBranchLinearSubNodeLength; }
141 virtual int32_t getMinLinearMatch() const { return BytesTrie::kMinLinearMatch; }
142 virtual int32_t getMaxLinearMatchLength() const { return BytesTrie::kMaxLinearMatchLength; }
143
144 // don't use #ifndef U_HIDE_INTERNAL_API with private class members
// Private nested node type for this builder: a LinearMatchNode subclass that
// additionally stores a `const char *`.
148 class BTLinearMatchNode : public LinearMatchNode {
149 public:
// units/len: the bytes of the linear match and their count (presumably `units`
// is what gets stored in `s` -- TODO confirm); nextNode: the node that follows.
150 BTLinearMatchNode(const char *units, int32_t len, Node *nextNode);
// Equality against any Node, declared virtual.
151 virtual UBool operator==(const Node &other) const;
// Writes this node through the given StringTrieBuilder.
152 virtual void write(StringTrieBuilder &builder);
153 private:
// Raw pointer to char data. Nothing visible here shows the node owning or
// freeing it -- NOTE(review): confirm lifetime in the implementation.
154 const char *s;
155 };
156
157 // don't use #ifndef U_HIDE_INTERNAL_API with private class members or virtual methods.
// Node factory hook. Its signature matches the base class's pure-virtual
// createLinearMatchNode(i, unitIndex, length, nextNode), with "unitIndex" named
// "byteIndex". Presumably returns a BTLinearMatchNode for `length` bytes of
// element `i` starting at `byteIndex` (TODO confirm in the implementation).
158 virtual Node *createLinearMatchNode(int32_t i, int32_t byteIndex, int32_t length,
159 Node *nextNode) const;
160
// Serialization helpers.
// ensureCapacity is non-virtual and returns UBool -- presumably FALSE when the
// `bytes` buffer cannot be grown to hold `length` (TODO confirm).
161 UBool ensureCapacity(int32_t length);
// Single-byte write; signature matches the base class's pure-virtual write(int32_t unit).
162 virtual int32_t write(int32_t byte);
// Non-virtual overload that takes a run of `length` bytes starting at `b`.
163 int32_t write(const char *b, int32_t length);
// The remaining four have signatures matching the base class's pure-virtual
// write* hooks of the same names. Each returns int32_t; the meaning of that
// value is not visible here (NOTE(review): confirm in the implementation).
164 virtual int32_t writeElementUnits(int32_t i, int32_t byteIndex, int32_t length);
165 virtual int32_t writeValueAndFinal(int32_t i, UBool isFinal);
166 virtual int32_t writeValueAndType(UBool hasValue, int32_t value, int32_t node);
167 virtual int32_t writeDeltaTo(int32_t jumpTarget);
168
// Builder state.
169 CharString *strings; // Pointer not object so we need not #include internal charstr.h.
// BytesTrieElement is only forward-declared in this header, so it is held by
// pointer. Presumably an array whose allocated size is elementsCapacity and
// whose used count is elementsLength (TODO confirm).
170 BytesTrieElement *elements;
171 int32_t elementsCapacity;
172 int32_t elementsLength;
173
174 // Byte serialization of the trie.
175 // Grows from the back: bytesLength measures from the end of the buffer!
176 char *bytes;
// presumably the allocated size of `bytes` (TODO confirm)
177 int32_t bytesCapacity;
// Counted from the end of the buffer, per the note above.
178 int32_t bytesLength;
179};
180
182
183#endif // __BYTESTRIEBUILDER_H__
C++ API: Trie for mapping byte sequences to integer values.
Builder class for BytesTrie.
BytesTrieBuilder(UErrorCode &errorCode)
Constructs an empty builder.
StringPiece buildStringPiece(UStringTrieBuildOption buildOption, UErrorCode &errorCode)
Builds a BytesTrie for the add()ed data and byte-serializes it.
BytesTrieBuilder & add(const StringPiece &s, int32_t value, UErrorCode &errorCode)
Adds a (byte sequence, value) pair.
virtual ~BytesTrieBuilder()
Destructor.
BytesTrieBuilder & clear()
Removes all (byte sequence, value) pairs.
BytesTrie * build(UStringTrieBuildOption buildOption, UErrorCode &errorCode)
Builds a BytesTrie for the add()ed data.
Light-weight, non-const reader class for a BytesTrie.
Definition: bytestrie.h:48
A string-like object that points to a sized piece of memory.
Definition: stringpiece.h:52
Base class for string trie builder classes.
virtual int32_t skipElementsBySomeUnits(int32_t i, int32_t unitIndex, int32_t count) const =0
virtual int32_t countElementUnits(int32_t start, int32_t limit, int32_t unitIndex) const =0
virtual int32_t getMaxBranchLinearSubNodeLength() const =0
virtual int32_t write(int32_t unit)=0
virtual Node * createLinearMatchNode(int32_t i, int32_t unitIndex, int32_t length, Node *nextNode) const =0
virtual int32_t indexOfElementWithNextUnit(int32_t i, int32_t unitIndex, UChar unit) const =0
virtual int32_t getMinLinearMatch() const =0
virtual int32_t getElementValue(int32_t i) const =0
virtual int32_t getElementStringLength(int32_t i) const =0
virtual UChar getElementUnit(int32_t i, int32_t unitIndex) const =0
virtual UBool matchNodesCanHaveValues() const =0
virtual int32_t writeValueAndFinal(int32_t i, UBool isFinal)=0
virtual int32_t getLimitOfLinearMatch(int32_t first, int32_t last, int32_t unitIndex) const =0
virtual int32_t writeElementUnits(int32_t i, int32_t unitIndex, int32_t length)=0
virtual int32_t writeDeltaTo(int32_t jumpTarget)=0
virtual int32_t getMaxLinearMatchLength() const =0
virtual int32_t writeValueAndType(UBool hasValue, int32_t value, int32_t node)=0
C++ API: StringPiece: Read-only byte string wrapper class.
U_EXPORT UBool operator==(const StringPiece &x, const StringPiece &y)
Global operator == for StringPiece.
C++ API: Builder API for trie builders.
UStringTrieBuildOption
Build options for BytesTrieBuilder and CharsTrieBuilder.
int8_t UBool
The ICU boolean type.
Definition: umachine.h:234
uint16_t UChar
Define UChar to be UCHAR_TYPE, if that is #defined (for example, to char16_t), or wchar_t if that is 16 bits wide; always assumed to be unsigned.
Definition: umachine.h:312
#define FALSE
The FALSE value of a UBool.
Definition: umachine.h:242
Basic definitions for ICU, for both C and C++ APIs.
UErrorCode
Error code to replace exception handling, so that the code is compatible with all C++ compilers, and to use the same mechanism for C and C++.
Definition: utypes.h:476
#define U_COMMON_API
Set to export library symbols from inside the common library, and to import them from outside.
Definition: utypes.h:357
#define U_NAMESPACE_END
This is used to end a declaration of a public ICU C++ API.
Definition: uversion.h:130
#define U_NAMESPACE_BEGIN
This is used to begin a declaration of a public ICU C++ API.
Definition: uversion.h:129