ICU 62.1
bytestriebuilder.h
Go to the documentation of this file.
1// © 2016 and later: Unicode, Inc. and others.
2// License & terms of use: http://www.unicode.org/copyright.html
3/*
4*******************************************************************************
5* Copyright (C) 2010-2016, International Business Machines
6* Corporation and others. All Rights Reserved.
7*******************************************************************************
8* file name: bytestriebuilder.h
9* encoding: UTF-8
10* tab size: 8 (not used)
11* indentation:4
12*
13* created on: 2010sep25
14* created by: Markus W. Scherer
15*/
16
22#ifndef __BYTESTRIEBUILDER_H__
23#define __BYTESTRIEBUILDER_H__
24
25#include "unicode/utypes.h"
26#include "unicode/bytestrie.h"
27#include "unicode/stringpiece.h"
29
31
32class BytesTrieElement;
33class CharString;
41public:
48
54
69 BytesTrieBuilder &add(StringPiece s, int32_t value, UErrorCode &errorCode); // Adds a (byte sequence, value) pair; errors are reported through errorCode. Returns a builder reference (presumably *this, for chaining -- confirm in the .cpp).
70
90
114
122
123private:
124 BytesTrieBuilder(const BytesTrieBuilder &other); // no copy constructor (declared in the private section so outside code cannot copy a builder)
125 BytesTrieBuilder &operator=(const BytesTrieBuilder &other); // no assignment operator (declared in the private section for the same reason)
126
127 void buildBytes(UStringTrieBuildOption buildOption, UErrorCode &errorCode); // Private build step taking the same arguments as build()/buildStringPiece(); presumably the shared implementation behind both -- confirm in the .cpp.
128
129 virtual int32_t getElementStringLength(int32_t i) const; // Same signature as the string-trie-builder base-class pure virtual; defined outside this header.
130 virtual char16_t getElementUnit(int32_t i, int32_t byteIndex) const; // Base class names the second parameter unitIndex; here it is a byte index, and the result is typed char16_t to match the base signature.
131 virtual int32_t getElementValue(int32_t i) const; // Same signature as the base-class pure virtual.
132
133 virtual int32_t getLimitOfLinearMatch(int32_t first, int32_t last, int32_t byteIndex) const; // Base-class counterpart uses unitIndex for the third parameter.
134
135 virtual int32_t countElementUnits(int32_t start, int32_t limit, int32_t byteIndex) const; // Base-class counterpart uses unitIndex for the third parameter.
136 virtual int32_t skipElementsBySomeUnits(int32_t i, int32_t byteIndex, int32_t count) const; // Base-class counterpart uses unitIndex for the second parameter.
137 virtual int32_t indexOfElementWithNextUnit(int32_t i, int32_t byteIndex, char16_t byte) const; // Base-class counterpart is (i, unitIndex, unit); the byte is passed as char16_t to match it.
138
139 virtual UBool matchNodesCanHaveValues() const { return FALSE; } // Always FALSE for this builder.
140
141 virtual int32_t getMaxBranchLinearSubNodeLength() const { return BytesTrie::kMaxBranchLinearSubNodeLength; } // Forwards the BytesTrie constant of the same name.
142 virtual int32_t getMinLinearMatch() const { return BytesTrie::kMinLinearMatch; } // Forwards the BytesTrie constant of the same name.
143 virtual int32_t getMaxLinearMatchLength() const { return BytesTrie::kMaxLinearMatchLength; } // Forwards the BytesTrie constant of the same name.
144
148 class BTLinearMatchNode : public LinearMatchNode { // Nested LinearMatchNode subclass used by this builder; its members are only declared here, not defined.
149 public:
150 BTLinearMatchNode(const char *units, int32_t len, Node *nextNode); // units: char buffer; len: presumably the number of units in it; nextNode: the node that follows (ownership is not visible from this header).
151 virtual UBool operator==(const Node &other) const; // Comparison against any Node, not only another BTLinearMatchNode.
152 virtual void write(StringTrieBuilder &builder); // Takes the builder by non-const reference.
153 private:
154 const char *s; // presumably holds the units pointer passed to the constructor -- confirm in the .cpp
155 };
156
157 virtual Node *createLinearMatchNode(int32_t i, int32_t byteIndex, int32_t length, // Same parameter list as the base-class pure virtual, which names the second parameter unitIndex.
158 Node *nextNode) const; // presumably returns a BTLinearMatchNode -- confirm in the .cpp
159
160 UBool ensureCapacity(int32_t length); // Non-virtual helper; presumably makes room in the bytes buffer and reports success -- confirm in the .cpp.
161 virtual int32_t write(int32_t byte); // Single-unit write; same signature as the base-class write(int32_t unit).
162 int32_t write(const char *b, int32_t length); // Non-virtual overload taking a char buffer and a length.
163 virtual int32_t writeElementUnits(int32_t i, int32_t byteIndex, int32_t length); // Base-class counterpart names the second parameter unitIndex.
164 virtual int32_t writeValueAndFinal(int32_t i, UBool isFinal); // Same signature as the base-class pure virtual.
165 virtual int32_t writeValueAndType(UBool hasValue, int32_t value, int32_t node); // Same signature as the base-class pure virtual.
166 virtual int32_t writeDeltaTo(int32_t jumpTarget); // Same signature as the base-class pure virtual.
167
168 CharString *strings; // Pointer not object so we need not #include internal charstr.h.
169 BytesTrieElement *elements;
170 int32_t elementsCapacity;
171 int32_t elementsLength;
172
173 // Byte serialization of the trie.
174 // Grows from the back: bytesLength measures from the end of the buffer!
175 char *bytes;
176 int32_t bytesCapacity;
177 int32_t bytesLength;
178};
179
181
182#endif // __BYTESTRIEBUILDER_H__
C++ API: Trie for mapping byte sequences to integer values.
Builder class for BytesTrie.
BytesTrieBuilder & add(StringPiece s, int32_t value, UErrorCode &errorCode)
Adds a (byte sequence, value) pair.
StringPiece buildStringPiece(UStringTrieBuildOption buildOption, UErrorCode &errorCode)
Builds a BytesTrie for the add()ed data and byte-serializes it.
BytesTrie * build(UStringTrieBuildOption buildOption, UErrorCode &errorCode)
Builds a BytesTrie for the add()ed data.
BytesTrieBuilder(UErrorCode &errorCode)
Constructs an empty builder.
virtual ~BytesTrieBuilder()
Destructor.
BytesTrieBuilder & clear()
Removes all (byte sequence, value) pairs.
Light-weight, non-const reader class for a BytesTrie.
Definition bytestrie.h:50
A string-like object that points to a sized piece of memory.
Definition stringpiece.h:54
Base class for string trie builder classes.
virtual int32_t writeValueAndFinal(int32_t i, UBool isFinal)=0
virtual int32_t getMaxBranchLinearSubNodeLength() const =0
virtual int32_t countElementUnits(int32_t start, int32_t limit, int32_t unitIndex) const =0
virtual int32_t writeDeltaTo(int32_t jumpTarget)=0
virtual int32_t getLimitOfLinearMatch(int32_t first, int32_t last, int32_t unitIndex) const =0
virtual int32_t getElementValue(int32_t i) const =0
virtual int32_t getMinLinearMatch() const =0
virtual int32_t skipElementsBySomeUnits(int32_t i, int32_t unitIndex, int32_t count) const =0
virtual int32_t writeValueAndType(UBool hasValue, int32_t value, int32_t node)=0
virtual int32_t indexOfElementWithNextUnit(int32_t i, int32_t unitIndex, char16_t unit) const =0
virtual UBool matchNodesCanHaveValues() const =0
virtual int32_t write(int32_t unit)=0
virtual char16_t getElementUnit(int32_t i, int32_t unitIndex) const =0
virtual Node * createLinearMatchNode(int32_t i, int32_t unitIndex, int32_t length, Node *nextNode) const =0
virtual int32_t getMaxLinearMatchLength() const =0
virtual int32_t getElementStringLength(int32_t i) const =0
virtual int32_t writeElementUnits(int32_t i, int32_t unitIndex, int32_t length)=0
U_EXPORT UBool operator==(const StringPiece &x, const StringPiece &y)
Global operator == for StringPiece.
C++ API: StringPiece: Read-only byte string wrapper class.
C++ API: Builder API for trie builders.
UStringTrieBuildOption
Build options for BytesTrieBuilder and CharsTrieBuilder.
int8_t UBool
The ICU boolean type.
Definition umachine.h:236
#define FALSE
The FALSE value of a UBool.
Definition umachine.h:244
Basic definitions for ICU, for both C and C++ APIs.
UErrorCode
Error code to replace exception handling, so that the code is compatible with all C++ compilers, and to use the same mechanism for C and C++.
Definition utypes.h:396
#define U_COMMON_API
Set to export library symbols from inside the common library, and to import them from outside.
Definition utypes.h:359
#define U_NAMESPACE_END
This is used to end a declaration of a public ICU C++ API.
Definition uversion.h:138
#define U_NAMESPACE_BEGIN
This is used to begin a declaration of a public ICU C++ API.
Definition uversion.h:137