1 /*
2 *******************************************************************************
3 * Copyright (C) 2010-2012, International Business Machines
4 * Corporation and others. All Rights Reserved.
5 *******************************************************************************
6 * file name: stringtriebuilder.cpp
7 * encoding: US-ASCII
8 * tab size: 8 (not used)
9 * indentation:4
10 *
11 * created on: 2010dec24
12 * created by: Markus W. Scherer
13 */
14
15 #include "utypeinfo.h" // for 'typeid' to work
16 #include "unicode/utypes.h"
17 #include "unicode/stringtriebuilder.h"
18 #include "uassert.h"
19 #include "uhash.h"
20
21 U_CDECL_BEGIN
22
23 static int32_t U_CALLCONV
hashStringTrieNode(const UHashTok key)24 hashStringTrieNode(const UHashTok key) {
25 return icu::StringTrieBuilder::hashNode(key.pointer);
26 }
27
28 static UBool U_CALLCONV
equalStringTrieNodes(const UHashTok key1,const UHashTok key2)29 equalStringTrieNodes(const UHashTok key1, const UHashTok key2) {
30 return icu::StringTrieBuilder::equalNodes(key1.pointer, key2.pointer);
31 }
32
33 U_CDECL_END
34
35 U_NAMESPACE_BEGIN
36
StringTrieBuilder()37 StringTrieBuilder::StringTrieBuilder() : nodes(NULL) {}
38
~StringTrieBuilder()39 StringTrieBuilder::~StringTrieBuilder() {
40 deleteCompactBuilder();
41 }
42
43 void
createCompactBuilder(int32_t sizeGuess,UErrorCode & errorCode)44 StringTrieBuilder::createCompactBuilder(int32_t sizeGuess, UErrorCode &errorCode) {
45 if(U_FAILURE(errorCode)) {
46 return;
47 }
48 nodes=uhash_openSize(hashStringTrieNode, equalStringTrieNodes, NULL,
49 sizeGuess, &errorCode);
50 if(U_SUCCESS(errorCode)) {
51 if(nodes==NULL) {
52 errorCode=U_MEMORY_ALLOCATION_ERROR;
53 } else {
54 uhash_setKeyDeleter(nodes, uprv_deleteUObject);
55 }
56 }
57 }
58
59 void
deleteCompactBuilder()60 StringTrieBuilder::deleteCompactBuilder() {
61 uhash_close(nodes);
62 nodes=NULL;
63 }
64
65 void
build(UStringTrieBuildOption buildOption,int32_t elementsLength,UErrorCode & errorCode)66 StringTrieBuilder::build(UStringTrieBuildOption buildOption, int32_t elementsLength,
67 UErrorCode &errorCode) {
68 if(buildOption==USTRINGTRIE_BUILD_FAST) {
69 writeNode(0, elementsLength, 0);
70 } else /* USTRINGTRIE_BUILD_SMALL */ {
71 createCompactBuilder(2*elementsLength, errorCode);
72 Node *root=makeNode(0, elementsLength, 0, errorCode);
73 if(U_SUCCESS(errorCode)) {
74 root->markRightEdgesFirst(-1);
75 root->write(*this);
76 }
77 deleteCompactBuilder();
78 }
79 }
80
81 // Requires start<limit,
82 // and all strings of the [start..limit[ elements must be sorted and
83 // have a common prefix of length unitIndex.
84 int32_t
writeNode(int32_t start,int32_t limit,int32_t unitIndex)85 StringTrieBuilder::writeNode(int32_t start, int32_t limit, int32_t unitIndex) {
86 UBool hasValue=FALSE;
87 int32_t value=0;
88 int32_t type;
89 if(unitIndex==getElementStringLength(start)) {
90 // An intermediate or final value.
91 value=getElementValue(start++);
92 if(start==limit) {
93 return writeValueAndFinal(value, TRUE); // final-value node
94 }
95 hasValue=TRUE;
96 }
97 // Now all [start..limit[ strings are longer than unitIndex.
98 int32_t minUnit=getElementUnit(start, unitIndex);
99 int32_t maxUnit=getElementUnit(limit-1, unitIndex);
100 if(minUnit==maxUnit) {
101 // Linear-match node: All strings have the same character at unitIndex.
102 int32_t lastUnitIndex=getLimitOfLinearMatch(start, limit-1, unitIndex);
103 writeNode(start, limit, lastUnitIndex);
104 // Break the linear-match sequence into chunks of at most kMaxLinearMatchLength.
105 int32_t length=lastUnitIndex-unitIndex;
106 int32_t maxLinearMatchLength=getMaxLinearMatchLength();
107 while(length>maxLinearMatchLength) {
108 lastUnitIndex-=maxLinearMatchLength;
109 length-=maxLinearMatchLength;
110 writeElementUnits(start, lastUnitIndex, maxLinearMatchLength);
111 write(getMinLinearMatch()+maxLinearMatchLength-1);
112 }
113 writeElementUnits(start, unitIndex, length);
114 type=getMinLinearMatch()+length-1;
115 } else {
116 // Branch node.
117 int32_t length=countElementUnits(start, limit, unitIndex);
118 // length>=2 because minUnit!=maxUnit.
119 writeBranchSubNode(start, limit, unitIndex, length);
120 if(--length<getMinLinearMatch()) {
121 type=length;
122 } else {
123 write(length);
124 type=0;
125 }
126 }
127 return writeValueAndType(hasValue, value, type);
128 }
129
130 // start<limit && all strings longer than unitIndex &&
131 // length different units at unitIndex
132 int32_t
writeBranchSubNode(int32_t start,int32_t limit,int32_t unitIndex,int32_t length)133 StringTrieBuilder::writeBranchSubNode(int32_t start, int32_t limit, int32_t unitIndex, int32_t length) {
134 UChar middleUnits[kMaxSplitBranchLevels];
135 int32_t lessThan[kMaxSplitBranchLevels];
136 int32_t ltLength=0;
137 while(length>getMaxBranchLinearSubNodeLength()) {
138 // Branch on the middle unit.
139 // First, find the middle unit.
140 int32_t i=skipElementsBySomeUnits(start, unitIndex, length/2);
141 // Encode the less-than branch first.
142 middleUnits[ltLength]=getElementUnit(i, unitIndex); // middle unit
143 lessThan[ltLength]=writeBranchSubNode(start, i, unitIndex, length/2);
144 ++ltLength;
145 // Continue for the greater-or-equal branch.
146 start=i;
147 length=length-length/2;
148 }
149 // For each unit, find its elements array start and whether it has a final value.
150 int32_t starts[kMaxBranchLinearSubNodeLength];
151 UBool isFinal[kMaxBranchLinearSubNodeLength-1];
152 int32_t unitNumber=0;
153 do {
154 int32_t i=starts[unitNumber]=start;
155 UChar unit=getElementUnit(i++, unitIndex);
156 i=indexOfElementWithNextUnit(i, unitIndex, unit);
157 isFinal[unitNumber]= start==i-1 && unitIndex+1==getElementStringLength(start);
158 start=i;
159 } while(++unitNumber<length-1);
160 // unitNumber==length-1, and the maxUnit elements range is [start..limit[
161 starts[unitNumber]=start;
162
163 // Write the sub-nodes in reverse order: The jump lengths are deltas from
164 // after their own positions, so if we wrote the minUnit sub-node first,
165 // then its jump delta would be larger.
166 // Instead we write the minUnit sub-node last, for a shorter delta.
167 int32_t jumpTargets[kMaxBranchLinearSubNodeLength-1];
168 do {
169 --unitNumber;
170 if(!isFinal[unitNumber]) {
171 jumpTargets[unitNumber]=writeNode(starts[unitNumber], starts[unitNumber+1], unitIndex+1);
172 }
173 } while(unitNumber>0);
174 // The maxUnit sub-node is written as the very last one because we do
175 // not jump for it at all.
176 unitNumber=length-1;
177 writeNode(start, limit, unitIndex+1);
178 int32_t offset=write(getElementUnit(start, unitIndex));
179 // Write the rest of this node's unit-value pairs.
180 while(--unitNumber>=0) {
181 start=starts[unitNumber];
182 int32_t value;
183 if(isFinal[unitNumber]) {
184 // Write the final value for the one string ending with this unit.
185 value=getElementValue(start);
186 } else {
187 // Write the delta to the start position of the sub-node.
188 value=offset-jumpTargets[unitNumber];
189 }
190 writeValueAndFinal(value, isFinal[unitNumber]);
191 offset=write(getElementUnit(start, unitIndex));
192 }
193 // Write the split-branch nodes.
194 while(ltLength>0) {
195 --ltLength;
196 writeDeltaTo(lessThan[ltLength]);
197 offset=write(middleUnits[ltLength]);
198 }
199 return offset;
200 }
201
202 // Requires start<limit,
203 // and all strings of the [start..limit[ elements must be sorted and
204 // have a common prefix of length unitIndex.
205 StringTrieBuilder::Node *
makeNode(int32_t start,int32_t limit,int32_t unitIndex,UErrorCode & errorCode)206 StringTrieBuilder::makeNode(int32_t start, int32_t limit, int32_t unitIndex, UErrorCode &errorCode) {
207 if(U_FAILURE(errorCode)) {
208 return NULL;
209 }
210 UBool hasValue=FALSE;
211 int32_t value=0;
212 if(unitIndex==getElementStringLength(start)) {
213 // An intermediate or final value.
214 value=getElementValue(start++);
215 if(start==limit) {
216 return registerFinalValue(value, errorCode);
217 }
218 hasValue=TRUE;
219 }
220 Node *node;
221 // Now all [start..limit[ strings are longer than unitIndex.
222 int32_t minUnit=getElementUnit(start, unitIndex);
223 int32_t maxUnit=getElementUnit(limit-1, unitIndex);
224 if(minUnit==maxUnit) {
225 // Linear-match node: All strings have the same character at unitIndex.
226 int32_t lastUnitIndex=getLimitOfLinearMatch(start, limit-1, unitIndex);
227 Node *nextNode=makeNode(start, limit, lastUnitIndex, errorCode);
228 // Break the linear-match sequence into chunks of at most kMaxLinearMatchLength.
229 int32_t length=lastUnitIndex-unitIndex;
230 int32_t maxLinearMatchLength=getMaxLinearMatchLength();
231 while(length>maxLinearMatchLength) {
232 lastUnitIndex-=maxLinearMatchLength;
233 length-=maxLinearMatchLength;
234 node=createLinearMatchNode(start, lastUnitIndex, maxLinearMatchLength, nextNode);
235 nextNode=registerNode(node, errorCode);
236 }
237 node=createLinearMatchNode(start, unitIndex, length, nextNode);
238 } else {
239 // Branch node.
240 int32_t length=countElementUnits(start, limit, unitIndex);
241 // length>=2 because minUnit!=maxUnit.
242 Node *subNode=makeBranchSubNode(start, limit, unitIndex, length, errorCode);
243 node=new BranchHeadNode(length, subNode);
244 }
245 if(hasValue && node!=NULL) {
246 if(matchNodesCanHaveValues()) {
247 ((ValueNode *)node)->setValue(value);
248 } else {
249 node=new IntermediateValueNode(value, registerNode(node, errorCode));
250 }
251 }
252 return registerNode(node, errorCode);
253 }
254
255 // start<limit && all strings longer than unitIndex &&
256 // length different units at unitIndex
257 StringTrieBuilder::Node *
makeBranchSubNode(int32_t start,int32_t limit,int32_t unitIndex,int32_t length,UErrorCode & errorCode)258 StringTrieBuilder::makeBranchSubNode(int32_t start, int32_t limit, int32_t unitIndex,
259 int32_t length, UErrorCode &errorCode) {
260 if(U_FAILURE(errorCode)) {
261 return NULL;
262 }
263 UChar middleUnits[kMaxSplitBranchLevels];
264 Node *lessThan[kMaxSplitBranchLevels];
265 int32_t ltLength=0;
266 while(length>getMaxBranchLinearSubNodeLength()) {
267 // Branch on the middle unit.
268 // First, find the middle unit.
269 int32_t i=skipElementsBySomeUnits(start, unitIndex, length/2);
270 // Create the less-than branch.
271 middleUnits[ltLength]=getElementUnit(i, unitIndex); // middle unit
272 lessThan[ltLength]=makeBranchSubNode(start, i, unitIndex, length/2, errorCode);
273 ++ltLength;
274 // Continue for the greater-or-equal branch.
275 start=i;
276 length=length-length/2;
277 }
278 if(U_FAILURE(errorCode)) {
279 return NULL;
280 }
281 ListBranchNode *listNode=new ListBranchNode();
282 if(listNode==NULL) {
283 errorCode=U_MEMORY_ALLOCATION_ERROR;
284 return NULL;
285 }
286 // For each unit, find its elements array start and whether it has a final value.
287 int32_t unitNumber=0;
288 do {
289 int32_t i=start;
290 UChar unit=getElementUnit(i++, unitIndex);
291 i=indexOfElementWithNextUnit(i, unitIndex, unit);
292 if(start==i-1 && unitIndex+1==getElementStringLength(start)) {
293 listNode->add(unit, getElementValue(start));
294 } else {
295 listNode->add(unit, makeNode(start, i, unitIndex+1, errorCode));
296 }
297 start=i;
298 } while(++unitNumber<length-1);
299 // unitNumber==length-1, and the maxUnit elements range is [start..limit[
300 UChar unit=getElementUnit(start, unitIndex);
301 if(start==limit-1 && unitIndex+1==getElementStringLength(start)) {
302 listNode->add(unit, getElementValue(start));
303 } else {
304 listNode->add(unit, makeNode(start, limit, unitIndex+1, errorCode));
305 }
306 Node *node=registerNode(listNode, errorCode);
307 // Create the split-branch nodes.
308 while(ltLength>0) {
309 --ltLength;
310 node=registerNode(
311 new SplitBranchNode(middleUnits[ltLength], lessThan[ltLength], node), errorCode);
312 }
313 return node;
314 }
315
316 StringTrieBuilder::Node *
registerNode(Node * newNode,UErrorCode & errorCode)317 StringTrieBuilder::registerNode(Node *newNode, UErrorCode &errorCode) {
318 if(U_FAILURE(errorCode)) {
319 delete newNode;
320 return NULL;
321 }
322 if(newNode==NULL) {
323 errorCode=U_MEMORY_ALLOCATION_ERROR;
324 return NULL;
325 }
326 const UHashElement *old=uhash_find(nodes, newNode);
327 if(old!=NULL) {
328 delete newNode;
329 return (Node *)old->key.pointer;
330 }
331 // If uhash_puti() returns a non-zero value from an equivalent, previously
332 // registered node, then uhash_find() failed to find that and we will leak newNode.
333 #if U_DEBUG
334 int32_t oldValue= // Only in debug mode to avoid a compiler warning about unused oldValue.
335 #endif
336 uhash_puti(nodes, newNode, 1, &errorCode);
337 U_ASSERT(oldValue==0);
338 if(U_FAILURE(errorCode)) {
339 delete newNode;
340 return NULL;
341 }
342 return newNode;
343 }
344
345 StringTrieBuilder::Node *
registerFinalValue(int32_t value,UErrorCode & errorCode)346 StringTrieBuilder::registerFinalValue(int32_t value, UErrorCode &errorCode) {
347 if(U_FAILURE(errorCode)) {
348 return NULL;
349 }
350 FinalValueNode key(value);
351 const UHashElement *old=uhash_find(nodes, &key);
352 if(old!=NULL) {
353 return (Node *)old->key.pointer;
354 }
355 Node *newNode=new FinalValueNode(value);
356 if(newNode==NULL) {
357 errorCode=U_MEMORY_ALLOCATION_ERROR;
358 return NULL;
359 }
360 // If uhash_puti() returns a non-zero value from an equivalent, previously
361 // registered node, then uhash_find() failed to find that and we will leak newNode.
362 #if U_DEBUG
363 int32_t oldValue= // Only in debug mode to avoid a compiler warning about unused oldValue.
364 #endif
365 uhash_puti(nodes, newNode, 1, &errorCode);
366 U_ASSERT(oldValue==0);
367 if(U_FAILURE(errorCode)) {
368 delete newNode;
369 return NULL;
370 }
371 return newNode;
372 }
373
374 UBool
hashNode(const void * node)375 StringTrieBuilder::hashNode(const void *node) {
376 return ((const Node *)node)->hashCode();
377 }
378
379 UBool
equalNodes(const void * left,const void * right)380 StringTrieBuilder::equalNodes(const void *left, const void *right) {
381 return *(const Node *)left==*(const Node *)right;
382 }
383
384 UOBJECT_DEFINE_NO_RTTI_IMPLEMENTATION(StringTrieBuilder)
385
386 UBool
387 StringTrieBuilder::Node::operator==(const Node &other) const {
388 return this==&other || (typeid(*this)==typeid(other) && hash==other.hash);
389 }
390
391 int32_t
markRightEdgesFirst(int32_t edgeNumber)392 StringTrieBuilder::Node::markRightEdgesFirst(int32_t edgeNumber) {
393 if(offset==0) {
394 offset=edgeNumber;
395 }
396 return edgeNumber;
397 }
398
399 UOBJECT_DEFINE_NO_RTTI_IMPLEMENTATION(StringTrieBuilder::Node)
400
401 UBool
402 StringTrieBuilder::FinalValueNode::operator==(const Node &other) const {
403 if(this==&other) {
404 return TRUE;
405 }
406 if(!Node::operator==(other)) {
407 return FALSE;
408 }
409 const FinalValueNode &o=(const FinalValueNode &)other;
410 return value==o.value;
411 }
412
413 void
write(StringTrieBuilder & builder)414 StringTrieBuilder::FinalValueNode::write(StringTrieBuilder &builder) {
415 offset=builder.writeValueAndFinal(value, TRUE);
416 }
417
418 UBool
operator ==(const Node & other) const419 StringTrieBuilder::ValueNode::operator==(const Node &other) const {
420 if(this==&other) {
421 return TRUE;
422 }
423 if(!Node::operator==(other)) {
424 return FALSE;
425 }
426 const ValueNode &o=(const ValueNode &)other;
427 return hasValue==o.hasValue && (!hasValue || value==o.value);
428 }
429
430 UBool
operator ==(const Node & other) const431 StringTrieBuilder::IntermediateValueNode::operator==(const Node &other) const {
432 if(this==&other) {
433 return TRUE;
434 }
435 if(!ValueNode::operator==(other)) {
436 return FALSE;
437 }
438 const IntermediateValueNode &o=(const IntermediateValueNode &)other;
439 return next==o.next;
440 }
441
442 int32_t
markRightEdgesFirst(int32_t edgeNumber)443 StringTrieBuilder::IntermediateValueNode::markRightEdgesFirst(int32_t edgeNumber) {
444 if(offset==0) {
445 offset=edgeNumber=next->markRightEdgesFirst(edgeNumber);
446 }
447 return edgeNumber;
448 }
449
450 void
write(StringTrieBuilder & builder)451 StringTrieBuilder::IntermediateValueNode::write(StringTrieBuilder &builder) {
452 next->write(builder);
453 offset=builder.writeValueAndFinal(value, FALSE);
454 }
455
456 UBool
operator ==(const Node & other) const457 StringTrieBuilder::LinearMatchNode::operator==(const Node &other) const {
458 if(this==&other) {
459 return TRUE;
460 }
461 if(!ValueNode::operator==(other)) {
462 return FALSE;
463 }
464 const LinearMatchNode &o=(const LinearMatchNode &)other;
465 return length==o.length && next==o.next;
466 }
467
468 int32_t
markRightEdgesFirst(int32_t edgeNumber)469 StringTrieBuilder::LinearMatchNode::markRightEdgesFirst(int32_t edgeNumber) {
470 if(offset==0) {
471 offset=edgeNumber=next->markRightEdgesFirst(edgeNumber);
472 }
473 return edgeNumber;
474 }
475
476 UBool
operator ==(const Node & other) const477 StringTrieBuilder::ListBranchNode::operator==(const Node &other) const {
478 if(this==&other) {
479 return TRUE;
480 }
481 if(!Node::operator==(other)) {
482 return FALSE;
483 }
484 const ListBranchNode &o=(const ListBranchNode &)other;
485 for(int32_t i=0; i<length; ++i) {
486 if(units[i]!=o.units[i] || values[i]!=o.values[i] || equal[i]!=o.equal[i]) {
487 return FALSE;
488 }
489 }
490 return TRUE;
491 }
492
493 int32_t
markRightEdgesFirst(int32_t edgeNumber)494 StringTrieBuilder::ListBranchNode::markRightEdgesFirst(int32_t edgeNumber) {
495 if(offset==0) {
496 firstEdgeNumber=edgeNumber;
497 int32_t step=0;
498 int32_t i=length;
499 do {
500 Node *edge=equal[--i];
501 if(edge!=NULL) {
502 edgeNumber=edge->markRightEdgesFirst(edgeNumber-step);
503 }
504 // For all but the rightmost edge, decrement the edge number.
505 step=1;
506 } while(i>0);
507 offset=edgeNumber;
508 }
509 return edgeNumber;
510 }
511
512 void
write(StringTrieBuilder & builder)513 StringTrieBuilder::ListBranchNode::write(StringTrieBuilder &builder) {
514 // Write the sub-nodes in reverse order: The jump lengths are deltas from
515 // after their own positions, so if we wrote the minUnit sub-node first,
516 // then its jump delta would be larger.
517 // Instead we write the minUnit sub-node last, for a shorter delta.
518 int32_t unitNumber=length-1;
519 Node *rightEdge=equal[unitNumber];
520 int32_t rightEdgeNumber= rightEdge==NULL ? firstEdgeNumber : rightEdge->getOffset();
521 do {
522 --unitNumber;
523 if(equal[unitNumber]!=NULL) {
524 equal[unitNumber]->writeUnlessInsideRightEdge(firstEdgeNumber, rightEdgeNumber, builder);
525 }
526 } while(unitNumber>0);
527 // The maxUnit sub-node is written as the very last one because we do
528 // not jump for it at all.
529 unitNumber=length-1;
530 if(rightEdge==NULL) {
531 builder.writeValueAndFinal(values[unitNumber], TRUE);
532 } else {
533 rightEdge->write(builder);
534 }
535 offset=builder.write(units[unitNumber]);
536 // Write the rest of this node's unit-value pairs.
537 while(--unitNumber>=0) {
538 int32_t value;
539 UBool isFinal;
540 if(equal[unitNumber]==NULL) {
541 // Write the final value for the one string ending with this unit.
542 value=values[unitNumber];
543 isFinal=TRUE;
544 } else {
545 // Write the delta to the start position of the sub-node.
546 U_ASSERT(equal[unitNumber]->getOffset()>0);
547 value=offset-equal[unitNumber]->getOffset();
548 isFinal=FALSE;
549 }
550 builder.writeValueAndFinal(value, isFinal);
551 offset=builder.write(units[unitNumber]);
552 }
553 }
554
555 UBool
operator ==(const Node & other) const556 StringTrieBuilder::SplitBranchNode::operator==(const Node &other) const {
557 if(this==&other) {
558 return TRUE;
559 }
560 if(!Node::operator==(other)) {
561 return FALSE;
562 }
563 const SplitBranchNode &o=(const SplitBranchNode &)other;
564 return unit==o.unit && lessThan==o.lessThan && greaterOrEqual==o.greaterOrEqual;
565 }
566
567 int32_t
markRightEdgesFirst(int32_t edgeNumber)568 StringTrieBuilder::SplitBranchNode::markRightEdgesFirst(int32_t edgeNumber) {
569 if(offset==0) {
570 firstEdgeNumber=edgeNumber;
571 edgeNumber=greaterOrEqual->markRightEdgesFirst(edgeNumber);
572 offset=edgeNumber=lessThan->markRightEdgesFirst(edgeNumber-1);
573 }
574 return edgeNumber;
575 }
576
577 void
write(StringTrieBuilder & builder)578 StringTrieBuilder::SplitBranchNode::write(StringTrieBuilder &builder) {
579 // Encode the less-than branch first.
580 lessThan->writeUnlessInsideRightEdge(firstEdgeNumber, greaterOrEqual->getOffset(), builder);
581 // Encode the greater-or-equal branch last because we do not jump for it at all.
582 greaterOrEqual->write(builder);
583 // Write this node.
584 U_ASSERT(lessThan->getOffset()>0);
585 builder.writeDeltaTo(lessThan->getOffset()); // less-than
586 offset=builder.write(unit);
587 }
588
589 UBool
operator ==(const Node & other) const590 StringTrieBuilder::BranchHeadNode::operator==(const Node &other) const {
591 if(this==&other) {
592 return TRUE;
593 }
594 if(!ValueNode::operator==(other)) {
595 return FALSE;
596 }
597 const BranchHeadNode &o=(const BranchHeadNode &)other;
598 return length==o.length && next==o.next;
599 }
600
601 int32_t
markRightEdgesFirst(int32_t edgeNumber)602 StringTrieBuilder::BranchHeadNode::markRightEdgesFirst(int32_t edgeNumber) {
603 if(offset==0) {
604 offset=edgeNumber=next->markRightEdgesFirst(edgeNumber);
605 }
606 return edgeNumber;
607 }
608
609 void
write(StringTrieBuilder & builder)610 StringTrieBuilder::BranchHeadNode::write(StringTrieBuilder &builder) {
611 next->write(builder);
612 if(length<=builder.getMinLinearMatch()) {
613 offset=builder.writeValueAndType(hasValue, value, length-1);
614 } else {
615 builder.write(length-1);
616 offset=builder.writeValueAndType(hasValue, value, 0);
617 }
618 }
619
620 U_NAMESPACE_END
621