1 // © 2016 and later: Unicode, Inc. and others.
2 // License & terms of use: http://www.unicode.org/copyright.html
3 /*
4 ******************************************************************************
5 *
6 * Copyright (C) 2001-2014, International Business Machines
7 * Corporation and others. All Rights Reserved.
8 *
9 ******************************************************************************
10 * file name: trietest.c
11 * encoding: UTF-8
12 * tab size: 8 (not used)
13 * indentation:4
14 *
15 * created on: 2008sep01 (starting from a copy of trietest.c)
16 * created by: Markus W. Scherer
17 */
18
19 #include <stdio.h>
20 #include "unicode/utypes.h"
21 #include "unicode/utf8.h"
22 #include "utrie2.h"
23 #include "utrie.h"
24 #include "cstring.h"
25 #include "cmemory.h"
26 #include "udataswp.h"
27 #include "cintltst.h"
28
/*
 * Forward declaration; the definition is not in this part of the file.
 * NOTE(review): presumably registers this file's tests below root - confirm.
 */
void addTrie2Test(TestNode** root);
30
31 /* Values for setting possibly overlapping, out-of-order ranges of values */
32 typedef struct SetRange {
33 UChar32 start, limit;
34 uint32_t value;
35 UBool overwrite;
36 } SetRange;
37
/*
 * Values for testing:
 * value is set from the previous boundary's limit to before
 * this boundary's limit
 *
 * There must be an entry with limit 0 and the initialValue.
 * It may be preceded by an entry with negative limit and the errorValue.
 */
typedef struct CheckRange {
    /* exclusive end of the range that carries this entry's value */
    UChar32 limit;
    /* expected value from the previous entry's limit up to limit-1 */
    uint32_t value;
} CheckRange;
50
51 static int32_t
skipSpecialValues(const CheckRange checkRanges[],int32_t countCheckRanges)52 skipSpecialValues(const CheckRange checkRanges[], int32_t countCheckRanges) {
53 int32_t i;
54 for(i=0; i<countCheckRanges && checkRanges[i].limit<=0; ++i) {}
55 return i;
56 }
57
58 static int32_t
getSpecialValues(const CheckRange checkRanges[],int32_t countCheckRanges,uint32_t * pInitialValue,uint32_t * pErrorValue)59 getSpecialValues(const CheckRange checkRanges[], int32_t countCheckRanges,
60 uint32_t *pInitialValue, uint32_t *pErrorValue) {
61 int32_t i=0;
62 if(i<countCheckRanges && checkRanges[i].limit<0) {
63 *pErrorValue=checkRanges[i++].value;
64 } else {
65 *pErrorValue=0xbad;
66 }
67 if(i<countCheckRanges && checkRanges[i].limit==0) {
68 *pInitialValue=checkRanges[i++].value;
69 } else {
70 *pInitialValue=0;
71 }
72 return i;
73 }
74
75 /* utrie2_enum() callback, modifies a value */
76 static uint32_t U_CALLCONV
testEnumValue(const void * context,uint32_t value)77 testEnumValue(const void *context, uint32_t value) {
78 return value^0x5555;
79 }
80
81 /* utrie2_enum() callback, verifies a range */
82 static UBool U_CALLCONV
testEnumRange(const void * context,UChar32 start,UChar32 end,uint32_t value)83 testEnumRange(const void *context, UChar32 start, UChar32 end, uint32_t value) {
84 const CheckRange **pb=(const CheckRange **)context;
85 const CheckRange *b=(*pb)++;
86 UChar32 limit=end+1;
87
88 value^=0x5555;
89 if(start!=(b-1)->limit || limit!=b->limit || value!=b->value) {
90 log_err("error: utrie2_enum() delivers wrong range [U+%04lx..U+%04lx].0x%lx instead of [U+%04lx..U+%04lx].0x%lx\n",
91 (long)start, (long)end, (long)value,
92 (long)(b-1)->limit, (long)b->limit-1, (long)b->value);
93 }
94 return TRUE;
95 }
96
97 static void
testTrieEnum(const char * testName,const UTrie2 * trie,const CheckRange checkRanges[],int32_t countCheckRanges)98 testTrieEnum(const char *testName,
99 const UTrie2 *trie,
100 const CheckRange checkRanges[], int32_t countCheckRanges) {
101 /* skip over special values */
102 while(countCheckRanges>0 && checkRanges[0].limit<=0) {
103 ++checkRanges;
104 --countCheckRanges;
105 }
106 utrie2_enum(trie, testEnumValue, testEnumRange, &checkRanges);
107 }
108
109 /* verify all expected values via UTRIE2_GETxx() */
110 static void
testTrieGetters(const char * testName,const UTrie2 * trie,UTrie2ValueBits valueBits,const CheckRange checkRanges[],int32_t countCheckRanges)111 testTrieGetters(const char *testName,
112 const UTrie2 *trie, UTrie2ValueBits valueBits,
113 const CheckRange checkRanges[], int32_t countCheckRanges) {
114 uint32_t initialValue, errorValue;
115 uint32_t value, value2;
116 UChar32 start, limit;
117 int32_t i, countSpecials;
118
119 UBool isFrozen=utrie2_isFrozen(trie);
120 const char *const typeName= isFrozen ? "frozen trie" : "newTrie";
121
122 countSpecials=getSpecialValues(checkRanges, countCheckRanges, &initialValue, &errorValue);
123
124 start=0;
125 for(i=countSpecials; i<countCheckRanges; ++i) {
126 limit=checkRanges[i].limit;
127 value=checkRanges[i].value;
128
129 while(start<limit) {
130 if(isFrozen) {
131 if(start<=0xffff) {
132 if(!U_IS_LEAD(start)) {
133 if(valueBits==UTRIE2_16_VALUE_BITS) {
134 value2=UTRIE2_GET16_FROM_U16_SINGLE_LEAD(trie, start);
135 } else {
136 value2=UTRIE2_GET32_FROM_U16_SINGLE_LEAD(trie, start);
137 }
138 if(value!=value2) {
139 log_err("error: %s(%s).fromBMP(U+%04lx)==0x%lx instead of 0x%lx\n",
140 typeName, testName, (long)start, (long)value2, (long)value);
141 }
142 }
143 } else {
144 if(valueBits==UTRIE2_16_VALUE_BITS) {
145 value2=UTRIE2_GET16_FROM_SUPP(trie, start);
146 } else {
147 value2=UTRIE2_GET32_FROM_SUPP(trie, start);
148 }
149 if(value!=value2) {
150 log_err("error: %s(%s).fromSupp(U+%04lx)==0x%lx instead of 0x%lx\n",
151 typeName, testName, (long)start, (long)value2, (long)value);
152 }
153 }
154 if(valueBits==UTRIE2_16_VALUE_BITS) {
155 value2=UTRIE2_GET16(trie, start);
156 } else {
157 value2=UTRIE2_GET32(trie, start);
158 }
159 if(value!=value2) {
160 log_err("error: %s(%s).get(U+%04lx)==0x%lx instead of 0x%lx\n",
161 typeName, testName, (long)start, (long)value2, (long)value);
162 }
163 }
164 value2=utrie2_get32(trie, start);
165 if(value!=value2) {
166 log_err("error: %s(%s).get32(U+%04lx)==0x%lx instead of 0x%lx\n",
167 typeName, testName, (long)start, (long)value2, (long)value);
168 }
169 ++start;
170 }
171 }
172
173 if(isFrozen) {
174 /* test linear ASCII range from the data array pointer (access to "internal" field) */
175 start=0;
176 for(i=countSpecials; i<countCheckRanges && start<=0x7f; ++i) {
177 limit=checkRanges[i].limit;
178 value=checkRanges[i].value;
179
180 while(start<limit && start<=0x7f) {
181 if(valueBits==UTRIE2_16_VALUE_BITS) {
182 value2=trie->data16[start];
183 } else {
184 value2=trie->data32[start];
185 }
186 if(value!=value2) {
187 log_err("error: %s(%s).asciiData[U+%04lx]==0x%lx instead of 0x%lx\n",
188 typeName, testName, (long)start, (long)value2, (long)value);
189 }
190 ++start;
191 }
192 }
193 while(start<=0xbf) {
194 if(valueBits==UTRIE2_16_VALUE_BITS) {
195 value2=trie->data16[start];
196 } else {
197 value2=trie->data32[start];
198 }
199 if(errorValue!=value2) {
200 log_err("error: %s(%s).badData[U+%04lx]==0x%lx instead of 0x%lx\n",
201 typeName, testName, (long)start, (long)value2, (long)errorValue);
202 }
203 ++start;
204 }
205 }
206
207 if(0!=strncmp(testName, "dummy", 5) && 0!=strncmp(testName, "trie1", 5)) {
208 /* test values for lead surrogate code units */
209 for(start=0xd7ff; start<0xdc01; ++start) {
210 switch(start) {
211 case 0xd7ff:
212 case 0xdc00:
213 value=errorValue;
214 break;
215 case 0xd800:
216 value=90;
217 break;
218 case 0xd999:
219 value=94;
220 break;
221 case 0xdbff:
222 value=99;
223 break;
224 default:
225 value=initialValue;
226 break;
227 }
228 if(isFrozen && U_IS_LEAD(start)) {
229 if(valueBits==UTRIE2_16_VALUE_BITS) {
230 value2=UTRIE2_GET16_FROM_U16_SINGLE_LEAD(trie, start);
231 } else {
232 value2=UTRIE2_GET32_FROM_U16_SINGLE_LEAD(trie, start);
233 }
234 if(value2!=value) {
235 log_err("error: %s(%s).LSCU(U+%04lx)==0x%lx instead of 0x%lx\n",
236 typeName, testName, (long)start, (long)value2, (long)value);
237 }
238 }
239 value2=utrie2_get32FromLeadSurrogateCodeUnit(trie, start);
240 if(value2!=value) {
241 log_err("error: %s(%s).lscu(U+%04lx)==0x%lx instead of 0x%lx\n",
242 typeName, testName, (long)start, (long)value2, (long)value);
243 }
244 }
245 }
246
247 /* test errorValue */
248 if(isFrozen) {
249 if(valueBits==UTRIE2_16_VALUE_BITS) {
250 value=UTRIE2_GET16(trie, -1);
251 value2=UTRIE2_GET16(trie, 0x110000);
252 } else {
253 value=UTRIE2_GET32(trie, -1);
254 value2=UTRIE2_GET32(trie, 0x110000);
255 }
256 if(value!=errorValue || value2!=errorValue) {
257 log_err("error: %s(%s).get(out of range) != errorValue\n",
258 typeName, testName);
259 }
260 }
261 value=utrie2_get32(trie, -1);
262 value2=utrie2_get32(trie, 0x110000);
263 if(value!=errorValue || value2!=errorValue) {
264 log_err("error: %s(%s).get32(out of range) != errorValue\n",
265 typeName, testName);
266 }
267 }
268
269 static void
testTrieUTF16(const char * testName,const UTrie2 * trie,UTrie2ValueBits valueBits,const CheckRange checkRanges[],int32_t countCheckRanges)270 testTrieUTF16(const char *testName,
271 const UTrie2 *trie, UTrie2ValueBits valueBits,
272 const CheckRange checkRanges[], int32_t countCheckRanges) {
273 UChar s[200];
274 uint32_t values[100];
275
276 const UChar *p, *limit;
277
278 uint32_t value;
279 UChar32 prevCP, c, c2;
280 int32_t i, length, sIndex, countValues;
281
282 /* write a string */
283 prevCP=0;
284 length=countValues=0;
285 for(i=skipSpecialValues(checkRanges, countCheckRanges); i<countCheckRanges; ++i) {
286 value=checkRanges[i].value;
287 /* write three code points */
288 U16_APPEND_UNSAFE(s, length, prevCP); /* start of the range */
289 values[countValues++]=value;
290 c=checkRanges[i].limit;
291 prevCP=(prevCP+c)/2; /* middle of the range */
292 U16_APPEND_UNSAFE(s, length, prevCP);
293 values[countValues++]=value;
294 prevCP=c;
295 --c; /* end of the range */
296 U16_APPEND_UNSAFE(s, length, c);
297 values[countValues++]=value;
298 }
299 limit=s+length;
300
301 /* try forward */
302 p=s;
303 i=0;
304 while(p<limit) {
305 sIndex=(int32_t)(p-s);
306 U16_NEXT(s, sIndex, length, c2);
307 c=0x33;
308 if(valueBits==UTRIE2_16_VALUE_BITS) {
309 UTRIE2_U16_NEXT16(trie, p, limit, c, value);
310 } else {
311 UTRIE2_U16_NEXT32(trie, p, limit, c, value);
312 }
313 if(value!=values[i]) {
314 log_err("error: wrong value from UTRIE2_NEXT(%s)(U+%04lx): 0x%lx instead of 0x%lx\n",
315 testName, (long)c, (long)value, (long)values[i]);
316 }
317 if(c!=c2) {
318 log_err("error: wrong code point from UTRIE2_NEXT(%s): U+%04lx != U+%04lx\n",
319 testName, (long)c, (long)c2);
320 continue;
321 }
322 ++i;
323 }
324
325 /* try backward */
326 p=limit;
327 i=countValues;
328 while(s<p) {
329 --i;
330 sIndex=(int32_t)(p-s);
331 U16_PREV(s, 0, sIndex, c2);
332 c=0x33;
333 if(valueBits==UTRIE2_16_VALUE_BITS) {
334 UTRIE2_U16_PREV16(trie, s, p, c, value);
335 } else {
336 UTRIE2_U16_PREV32(trie, s, p, c, value);
337 }
338 if(value!=values[i]) {
339 log_err("error: wrong value from UTRIE2_PREV(%s)(U+%04lx): 0x%lx instead of 0x%lx\n",
340 testName, (long)c, (long)value, (long)values[i]);
341 }
342 if(c!=c2) {
343 log_err("error: wrong code point from UTRIE2_PREV(%s): U+%04lx != U+%04lx\n",
344 testName, c, c2);
345 }
346 }
347 }
348
349 static void
testTrieUTF8(const char * testName,const UTrie2 * trie,UTrie2ValueBits valueBits,const CheckRange checkRanges[],int32_t countCheckRanges)350 testTrieUTF8(const char *testName,
351 const UTrie2 *trie, UTrie2ValueBits valueBits,
352 const CheckRange checkRanges[], int32_t countCheckRanges) {
353 // Note: The byte sequence comments refer to the original UTF-8 definition.
354 // Starting with ICU 60, any sequence that is not a prefix of a valid one
355 // is treated as multiple single-byte errors.
356 // For testing, we only rely on U8_... and UTrie2 UTF-8 macros
357 // iterating consistently.
358 static const uint8_t illegal[]={
359 0xc0, 0x80, /* non-shortest U+0000 */
360 0xc1, 0xbf, /* non-shortest U+007f */
361 0xc2, /* truncated */
362 0xe0, 0x90, 0x80, /* non-shortest U+0400 */
363 0xe0, 0xa0, /* truncated */
364 0xed, 0xa0, 0x80, /* lead surrogate U+d800 */
365 0xed, 0xbf, 0xbf, /* trail surrogate U+dfff */
366 0xf0, 0x8f, 0xbf, 0xbf, /* non-shortest U+ffff */
367 0xf0, 0x90, 0x80, /* truncated */
368 0xf4, 0x90, 0x80, 0x80, /* beyond-Unicode U+110000 */
369 0xf8, 0x80, 0x80, 0x80, /* truncated */
370 0xf8, 0x80, 0x80, 0x80, 0x80, /* 5-byte UTF-8 */
371 0xfd, 0xbf, 0xbf, 0xbf, 0xbf, /* truncated */
372 0xfd, 0xbf, 0xbf, 0xbf, 0xbf, 0xbf, /* 6-byte UTF-8 */
373 0xfe,
374 0xff
375 };
376 uint8_t s[600];
377 uint32_t values[200];
378
379 const uint8_t *p, *limit;
380
381 uint32_t initialValue, errorValue;
382 uint32_t value, bytes;
383 UChar32 prevCP, c;
384 int32_t i, countSpecials, length, countValues;
385 int32_t prev8, i8;
386
387 countSpecials=getSpecialValues(checkRanges, countCheckRanges, &initialValue, &errorValue);
388
389 /* write a string */
390 prevCP=0;
391 length=countValues=0;
392 /* first a couple of trail bytes in lead position */
393 s[length++]=0x80;
394 values[countValues++]=errorValue;
395 s[length++]=0xbf;
396 values[countValues++]=errorValue;
397 prev8=i8=0;
398 for(i=countSpecials; i<countCheckRanges; ++i) {
399 value=checkRanges[i].value;
400 /* write three legal (or surrogate) code points */
401 U8_APPEND_UNSAFE(s, length, prevCP); /* start of the range */
402 if(U_IS_SURROGATE(prevCP)) {
403 // A surrogate byte sequence counts as 3 single-byte errors.
404 values[countValues++]=errorValue;
405 values[countValues++]=errorValue;
406 values[countValues++]=errorValue;
407 } else {
408 values[countValues++]=value;
409 }
410 c=checkRanges[i].limit;
411 prevCP=(prevCP+c)/2; /* middle of the range */
412 U8_APPEND_UNSAFE(s, length, prevCP);
413 if(U_IS_SURROGATE(prevCP)) {
414 // A surrogate byte sequence counts as 3 single-byte errors.
415 values[countValues++]=errorValue;
416 values[countValues++]=errorValue;
417 values[countValues++]=errorValue;
418 } else {
419 values[countValues++]=value;
420 }
421 prevCP=c;
422 --c; /* end of the range */
423 U8_APPEND_UNSAFE(s, length, c);
424 if(U_IS_SURROGATE(c)) {
425 // A surrogate byte sequence counts as 3 single-byte errors.
426 values[countValues++]=errorValue;
427 values[countValues++]=errorValue;
428 values[countValues++]=errorValue;
429 } else {
430 values[countValues++]=value;
431 }
432 /* write an illegal byte sequence */
433 if(i8<sizeof(illegal)) {
434 U8_FWD_1(illegal, i8, sizeof(illegal));
435 while(prev8<i8) {
436 s[length++]=illegal[prev8++];
437 }
438 values[countValues++]=errorValue;
439 }
440 }
441 /* write the remaining illegal byte sequences */
442 while(i8<sizeof(illegal)) {
443 U8_FWD_1(illegal, i8, sizeof(illegal));
444 while(prev8<i8) {
445 s[length++]=illegal[prev8++];
446 }
447 values[countValues++]=errorValue;
448 }
449 limit=s+length;
450
451 /* try forward */
452 p=s;
453 i=0;
454 while(p<limit) {
455 prev8=i8=(int32_t)(p-s);
456 U8_NEXT(s, i8, length, c);
457 if(valueBits==UTRIE2_16_VALUE_BITS) {
458 UTRIE2_U8_NEXT16(trie, p, limit, value);
459 } else {
460 UTRIE2_U8_NEXT32(trie, p, limit, value);
461 }
462 bytes=0;
463 if(value!=values[i] || i8!=(p-s)) {
464 int32_t k=prev8;
465 while(k<i8) {
466 bytes=(bytes<<8)|s[k++];
467 }
468 }
469 if(value!=values[i]) {
470 log_err("error: wrong value from UTRIE2_U8_NEXT(%s)(from %d %lx->U+%04lx) (read %d bytes): "
471 "0x%lx instead of 0x%lx\n",
472 testName, (int)prev8, (unsigned long)bytes, (long)c, (int)((p-s)-prev8),
473 (long)value, (long)values[i]);
474 }
475 if(i8!=(p-s)) {
476 log_err("error: wrong end index from UTRIE2_U8_NEXT(%s)(from %d %lx->U+%04lx): %ld != %ld\n",
477 testName, (int)prev8, (unsigned long)bytes, (long)c, (long)(p-s), (long)i8);
478 continue;
479 }
480 ++i;
481 }
482
483 /* try backward */
484 p=limit;
485 i=countValues;
486 while(s<p) {
487 --i;
488 prev8=i8=(int32_t)(p-s);
489 U8_PREV(s, 0, i8, c);
490 if(valueBits==UTRIE2_16_VALUE_BITS) {
491 UTRIE2_U8_PREV16(trie, s, p, value);
492 } else {
493 UTRIE2_U8_PREV32(trie, s, p, value);
494 }
495 bytes=0;
496 if(value!=values[i] || i8!=(p-s)) {
497 int32_t k=i8;
498 while(k<prev8) {
499 bytes=(bytes<<8)|s[k++];
500 }
501 }
502 if(value!=values[i]) {
503 log_err("error: wrong value from UTRIE2_U8_PREV(%s)(from %d %lx->U+%04lx) (read %d bytes): "
504 ": 0x%lx instead of 0x%lx\n",
505 testName, (int)prev8, (unsigned long)bytes, (long)c, (int)(prev8-(p-s)),
506 (long)value, (long)values[i]);
507 }
508 if(i8!=(p-s)) {
509 log_err("error: wrong end index from UTRIE2_U8_PREV(%s)(from %d %lx->U+%04lx): %ld != %ld\n",
510 testName, (int)prev8, (unsigned long)bytes, (long)c, (long)(p-s), (long)i8);
511 continue;
512 }
513 }
514 }
515
516 static void
testFrozenTrie(const char * testName,UTrie2 * trie,UTrie2ValueBits valueBits,const CheckRange checkRanges[],int32_t countCheckRanges)517 testFrozenTrie(const char *testName,
518 UTrie2 *trie, UTrie2ValueBits valueBits,
519 const CheckRange checkRanges[], int32_t countCheckRanges) {
520 UErrorCode errorCode;
521 uint32_t value, value2;
522
523 if(!utrie2_isFrozen(trie)) {
524 log_err("error: utrie2_isFrozen(frozen %s) returned FALSE (not frozen)\n",
525 testName);
526 return;
527 }
528
529 testTrieGetters(testName, trie, valueBits, checkRanges, countCheckRanges);
530 testTrieEnum(testName, trie, checkRanges, countCheckRanges);
531 testTrieUTF16(testName, trie, valueBits, checkRanges, countCheckRanges);
532 testTrieUTF8(testName, trie, valueBits, checkRanges, countCheckRanges);
533
534 errorCode=U_ZERO_ERROR;
535 value=utrie2_get32(trie, 1);
536 utrie2_set32(trie, 1, 234, &errorCode);
537 value2=utrie2_get32(trie, 1);
538 if(errorCode!=U_NO_WRITE_PERMISSION || value2!=value) {
539 log_err("error: utrie2_set32(frozen %s) failed: it set %s != U_NO_WRITE_PERMISSION\n",
540 testName, u_errorName(errorCode));
541 return;
542 }
543
544 errorCode=U_ZERO_ERROR;
545 utrie2_setRange32(trie, 1, 5, 234, TRUE, &errorCode);
546 value2=utrie2_get32(trie, 1);
547 if(errorCode!=U_NO_WRITE_PERMISSION || value2!=value) {
548 log_err("error: utrie2_setRange32(frozen %s) failed: it set %s != U_NO_WRITE_PERMISSION\n",
549 testName, u_errorName(errorCode));
550 return;
551 }
552
553 errorCode=U_ZERO_ERROR;
554 value=utrie2_get32FromLeadSurrogateCodeUnit(trie, 0xd801);
555 utrie2_set32ForLeadSurrogateCodeUnit(trie, 0xd801, 234, &errorCode);
556 value2=utrie2_get32FromLeadSurrogateCodeUnit(trie, 0xd801);
557 if(errorCode!=U_NO_WRITE_PERMISSION || value2!=value) {
558 log_err("error: utrie2_set32ForLeadSurrogateCodeUnit(frozen %s) failed: "
559 "it set %s != U_NO_WRITE_PERMISSION\n",
560 testName, u_errorName(errorCode));
561 return;
562 }
563 }
564
565 static void
testNewTrie(const char * testName,const UTrie2 * trie,const CheckRange checkRanges[],int32_t countCheckRanges)566 testNewTrie(const char *testName, const UTrie2 *trie,
567 const CheckRange checkRanges[], int32_t countCheckRanges) {
568 /* The valueBits are ignored for an unfrozen trie. */
569 testTrieGetters(testName, trie, UTRIE2_COUNT_VALUE_BITS, checkRanges, countCheckRanges);
570 testTrieEnum(testName, trie, checkRanges, countCheckRanges);
571 }
572
573 static void
testTrieSerialize(const char * testName,UTrie2 * trie,UTrie2ValueBits valueBits,UBool withSwap,const CheckRange checkRanges[],int32_t countCheckRanges)574 testTrieSerialize(const char *testName,
575 UTrie2 *trie, UTrie2ValueBits valueBits,
576 UBool withSwap,
577 const CheckRange checkRanges[], int32_t countCheckRanges) {
578 uint32_t storage[10000];
579 int32_t length1, length2, length3;
580 UTrie2ValueBits otherValueBits;
581 UErrorCode errorCode;
582
583 /* clone the trie so that the caller can reuse the original */
584 errorCode=U_ZERO_ERROR;
585 trie=utrie2_clone(trie, &errorCode);
586 if(U_FAILURE(errorCode)) {
587 log_err("error: utrie2_clone(unfrozen %s) failed - %s\n",
588 testName, u_errorName(errorCode));
589 return;
590 }
591
592 /*
593 * This is not a loop, but simply a block that we can exit with "break"
594 * when something goes wrong.
595 */
596 do {
597 errorCode=U_ZERO_ERROR;
598 utrie2_serialize(trie, storage, sizeof(storage), &errorCode);
599 if(errorCode!=U_ILLEGAL_ARGUMENT_ERROR) {
600 log_err("error: utrie2_serialize(unfrozen %s) set %s != U_ILLEGAL_ARGUMENT_ERROR\n",
601 testName, u_errorName(errorCode));
602 break;
603 }
604 errorCode=U_ZERO_ERROR;
605 utrie2_freeze(trie, valueBits, &errorCode);
606 if(U_FAILURE(errorCode) || !utrie2_isFrozen(trie)) {
607 log_err("error: utrie2_freeze(%s) failed: %s isFrozen: %d\n",
608 testName, u_errorName(errorCode), utrie2_isFrozen(trie));
609 break;
610 }
611 otherValueBits= valueBits==UTRIE2_16_VALUE_BITS ? UTRIE2_32_VALUE_BITS : UTRIE2_16_VALUE_BITS;
612 utrie2_freeze(trie, otherValueBits, &errorCode);
613 if(errorCode!=U_ILLEGAL_ARGUMENT_ERROR) {
614 log_err("error: utrie2_freeze(already-frozen with other valueBits %s) "
615 "set %s != U_ILLEGAL_ARGUMENT_ERROR\n",
616 testName, u_errorName(errorCode));
617 break;
618 }
619 errorCode=U_ZERO_ERROR;
620 if(withSwap) {
621 /* clone a frozen trie */
622 UTrie2 *clone=utrie2_clone(trie, &errorCode);
623 if(U_FAILURE(errorCode)) {
624 log_err("error: cloning a frozen UTrie2 failed (%s) - %s\n",
625 testName, u_errorName(errorCode));
626 errorCode=U_ZERO_ERROR; /* continue with the original */
627 } else {
628 utrie2_close(trie);
629 trie=clone;
630 }
631 }
632 length1=utrie2_serialize(trie, NULL, 0, &errorCode);
633 if(errorCode!=U_BUFFER_OVERFLOW_ERROR) {
634 log_err("error: utrie2_serialize(%s) preflighting set %s != U_BUFFER_OVERFLOW_ERROR\n",
635 testName, u_errorName(errorCode));
636 break;
637 }
638 errorCode=U_ZERO_ERROR;
639 length2=utrie2_serialize(trie, storage, sizeof(storage), &errorCode);
640 if(errorCode==U_BUFFER_OVERFLOW_ERROR) {
641 log_err("error: utrie2_serialize(%s) needs more memory\n", testName);
642 break;
643 }
644 if(U_FAILURE(errorCode)) {
645 log_err("error: utrie2_serialize(%s) failed: %s\n", testName, u_errorName(errorCode));
646 break;
647 }
648 if(length1!=length2) {
649 log_err("error: trie serialization (%s) lengths different: "
650 "preflight vs. serialize\n", testName);
651 break;
652 }
653
654 testFrozenTrie(testName, trie, valueBits, checkRanges, countCheckRanges);
655 utrie2_close(trie);
656 trie=NULL;
657
658 if(withSwap) {
659 uint32_t swapped[10000];
660 int32_t swappedLength;
661
662 UDataSwapper *ds;
663
664 /* swap to opposite-endian */
665 uprv_memset(swapped, 0x55, length2);
666 ds=udata_openSwapper(U_IS_BIG_ENDIAN, U_CHARSET_FAMILY,
667 !U_IS_BIG_ENDIAN, U_CHARSET_FAMILY, &errorCode);
668 swappedLength=utrie2_swap(ds, storage, -1, NULL, &errorCode);
669 if(U_FAILURE(errorCode) || swappedLength!=length2) {
670 log_err("error: utrie2_swap(%s to OE preflighting) failed (%s) "
671 "or before/after lengths different\n",
672 testName, u_errorName(errorCode));
673 udata_closeSwapper(ds);
674 break;
675 }
676 swappedLength=utrie2_swap(ds, storage, length2, swapped, &errorCode);
677 udata_closeSwapper(ds);
678 if(U_FAILURE(errorCode) || swappedLength!=length2) {
679 log_err("error: utrie2_swap(%s to OE) failed (%s) or before/after lengths different\n",
680 testName, u_errorName(errorCode));
681 break;
682 }
683
684 /* swap back to platform-endian */
685 uprv_memset(storage, 0xaa, length2);
686 ds=udata_openSwapper(!U_IS_BIG_ENDIAN, U_CHARSET_FAMILY,
687 U_IS_BIG_ENDIAN, U_CHARSET_FAMILY, &errorCode);
688 swappedLength=utrie2_swap(ds, swapped, -1, NULL, &errorCode);
689 if(U_FAILURE(errorCode) || swappedLength!=length2) {
690 log_err("error: utrie2_swap(%s to PE preflighting) failed (%s) "
691 "or before/after lengths different\n",
692 testName, u_errorName(errorCode));
693 udata_closeSwapper(ds);
694 break;
695 }
696 swappedLength=utrie2_swap(ds, swapped, length2, storage, &errorCode);
697 udata_closeSwapper(ds);
698 if(U_FAILURE(errorCode) || swappedLength!=length2) {
699 log_err("error: utrie2_swap(%s to PE) failed (%s) or before/after lengths different\n",
700 testName, u_errorName(errorCode));
701 break;
702 }
703 }
704
705 trie=utrie2_openFromSerialized(valueBits, storage, length2, &length3, &errorCode);
706 if(U_FAILURE(errorCode)) {
707 log_err("error: utrie2_openFromSerialized(%s) failed, %s\n", testName, u_errorName(errorCode));
708 break;
709 }
710 if((valueBits==UTRIE2_16_VALUE_BITS)!=(trie->data32==NULL)) {
711 log_err("error: trie serialization (%s) did not preserve 32-bitness\n", testName);
712 break;
713 }
714 if(length2!=length3) {
715 log_err("error: trie serialization (%s) lengths different: "
716 "serialize vs. unserialize\n", testName);
717 break;
718 }
719 /* overwrite the storage that is not supposed to be needed */
720 uprv_memset((char *)storage+length3, 0xfa, (int32_t)(sizeof(storage)-length3));
721
722 utrie2_freeze(trie, valueBits, &errorCode);
723 if(U_FAILURE(errorCode) || !utrie2_isFrozen(trie)) {
724 log_err("error: utrie2_freeze(unserialized %s) failed: %s isFrozen: %d\n",
725 testName, u_errorName(errorCode), utrie2_isFrozen(trie));
726 break;
727 }
728 utrie2_freeze(trie, otherValueBits, &errorCode);
729 if(errorCode!=U_ILLEGAL_ARGUMENT_ERROR) {
730 log_err("error: utrie2_freeze(unserialized with other valueBits %s) "
731 "set %s != U_ILLEGAL_ARGUMENT_ERROR\n",
732 testName, u_errorName(errorCode));
733 break;
734 }
735 errorCode=U_ZERO_ERROR;
736 if(withSwap) {
737 /* clone an unserialized trie */
738 UTrie2 *clone=utrie2_clone(trie, &errorCode);
739 if(U_FAILURE(errorCode)) {
740 log_err("error: utrie2_clone(unserialized %s) failed - %s\n",
741 testName, u_errorName(errorCode));
742 errorCode=U_ZERO_ERROR;
743 /* no need to break: just test the original trie */
744 } else {
745 utrie2_close(trie);
746 trie=clone;
747 uprv_memset(storage, 0, sizeof(storage));
748 }
749 }
750 testFrozenTrie(testName, trie, valueBits, checkRanges, countCheckRanges);
751 {
752 /* clone-as-thawed an unserialized trie */
753 UTrie2 *clone=utrie2_cloneAsThawed(trie, &errorCode);
754 if(U_FAILURE(errorCode) || utrie2_isFrozen(clone)) {
755 log_err("error: utrie2_cloneAsThawed(unserialized %s) failed - "
756 "%s (isFrozen: %d)\n",
757 testName, u_errorName(errorCode), clone!=NULL && utrie2_isFrozen(trie));
758 break;
759 } else {
760 utrie2_close(trie);
761 trie=clone;
762 }
763 }
764 {
765 uint32_t value, value2;
766
767 value=utrie2_get32(trie, 0xa1);
768 utrie2_set32(trie, 0xa1, 789, &errorCode);
769 value2=utrie2_get32(trie, 0xa1);
770 utrie2_set32(trie, 0xa1, value, &errorCode);
771 if(U_FAILURE(errorCode) || value2!=789) {
772 log_err("error: modifying a cloneAsThawed UTrie2 (%s) failed - %s\n",
773 testName, u_errorName(errorCode));
774 }
775 }
776 testNewTrie(testName, trie, checkRanges, countCheckRanges);
777 } while(0);
778
779 utrie2_close(trie);
780 }
781
782 static UTrie2 *
testTrieSerializeAllValueBits(const char * testName,UTrie2 * trie,UBool withClone,const CheckRange checkRanges[],int32_t countCheckRanges)783 testTrieSerializeAllValueBits(const char *testName,
784 UTrie2 *trie, UBool withClone,
785 const CheckRange checkRanges[], int32_t countCheckRanges) {
786 char name[40];
787
788 /* verify that all the expected values are in the unfrozen trie */
789 testNewTrie(testName, trie, checkRanges, countCheckRanges);
790
791 /*
792 * Test with both valueBits serializations,
793 * and that utrie2_serialize() can be called multiple times.
794 */
795 uprv_strcpy(name, testName);
796 uprv_strcat(name, ".16");
797 testTrieSerialize(name, trie,
798 UTRIE2_16_VALUE_BITS, withClone,
799 checkRanges, countCheckRanges);
800
801 if(withClone) {
802 /*
803 * try cloning after the first serialization;
804 * clone-as-thawed just to sometimes try it on an unfrozen trie
805 */
806 UErrorCode errorCode=U_ZERO_ERROR;
807 UTrie2 *clone=utrie2_cloneAsThawed(trie, &errorCode);
808 if(U_FAILURE(errorCode)) {
809 log_err("error: utrie2_cloneAsThawed(%s) after serialization failed - %s\n",
810 testName, u_errorName(errorCode));
811 } else {
812 utrie2_close(trie);
813 trie=clone;
814
815 testNewTrie(testName, trie, checkRanges, countCheckRanges);
816 }
817 }
818
819 uprv_strcpy(name, testName);
820 uprv_strcat(name, ".32");
821 testTrieSerialize(name, trie,
822 UTRIE2_32_VALUE_BITS, withClone,
823 checkRanges, countCheckRanges);
824
825 return trie; /* could be the clone */
826 }
827
828 static UTrie2 *
makeTrieWithRanges(const char * testName,UBool withClone,const SetRange setRanges[],int32_t countSetRanges,const CheckRange checkRanges[],int32_t countCheckRanges)829 makeTrieWithRanges(const char *testName, UBool withClone,
830 const SetRange setRanges[], int32_t countSetRanges,
831 const CheckRange checkRanges[], int32_t countCheckRanges) {
832 UTrie2 *trie;
833 uint32_t initialValue, errorValue;
834 uint32_t value;
835 UChar32 start, limit;
836 int32_t i;
837 UErrorCode errorCode;
838 UBool overwrite;
839
840 log_verbose("\ntesting Trie '%s'\n", testName);
841 errorCode=U_ZERO_ERROR;
842 getSpecialValues(checkRanges, countCheckRanges, &initialValue, &errorValue);
843 trie=utrie2_open(initialValue, errorValue, &errorCode);
844 if(U_FAILURE(errorCode)) {
845 log_err("error: utrie2_open(%s) failed: %s\n", testName, u_errorName(errorCode));
846 return NULL;
847 }
848
849 /* set values from setRanges[] */
850 for(i=0; i<countSetRanges; ++i) {
851 if(withClone && i==countSetRanges/2) {
852 /* switch to a clone in the middle of setting values */
853 UTrie2 *clone=utrie2_clone(trie, &errorCode);
854 if(U_FAILURE(errorCode)) {
855 log_err("error: utrie2_clone(%s) failed - %s\n",
856 testName, u_errorName(errorCode));
857 errorCode=U_ZERO_ERROR; /* continue with the original */
858 } else {
859 utrie2_close(trie);
860 trie=clone;
861 }
862 }
863 start=setRanges[i].start;
864 limit=setRanges[i].limit;
865 value=setRanges[i].value;
866 overwrite=setRanges[i].overwrite;
867 if((limit-start)==1 && overwrite) {
868 utrie2_set32(trie, start, value, &errorCode);
869 } else {
870 utrie2_setRange32(trie, start, limit-1, value, overwrite, &errorCode);
871 }
872 }
873
874 /* set some values for lead surrogate code units */
875 utrie2_set32ForLeadSurrogateCodeUnit(trie, 0xd800, 90, &errorCode);
876 utrie2_set32ForLeadSurrogateCodeUnit(trie, 0xd999, 94, &errorCode);
877 utrie2_set32ForLeadSurrogateCodeUnit(trie, 0xdbff, 99, &errorCode);
878 if(U_SUCCESS(errorCode)) {
879 return trie;
880 } else {
881 log_err("error: setting values into a trie (%s) failed - %s\n",
882 testName, u_errorName(errorCode));
883 utrie2_close(trie);
884 return NULL;
885 }
886 }
887
888 static void
testTrieRanges(const char * testName,UBool withClone,const SetRange setRanges[],int32_t countSetRanges,const CheckRange checkRanges[],int32_t countCheckRanges)889 testTrieRanges(const char *testName, UBool withClone,
890 const SetRange setRanges[], int32_t countSetRanges,
891 const CheckRange checkRanges[], int32_t countCheckRanges) {
892 UTrie2 *trie=makeTrieWithRanges(testName, withClone,
893 setRanges, countSetRanges,
894 checkRanges, countCheckRanges);
895 if(trie!=NULL) {
896 trie=testTrieSerializeAllValueBits(testName, trie, withClone,
897 checkRanges, countCheckRanges);
898 utrie2_close(trie);
899 }
900 }
901
902 /* test data ----------------------------------------------------------------*/
903
/*
 * set consecutive ranges, even with value 0
 *
 * Fields: start, limit (exclusive), value, overwrite.
 * Two stretches are not set: U+da9e..U+dad9 and U+60003..U+f0002.
 */
static const SetRange
setRanges1[]={
    { 0, 0x40, 0, FALSE },
    { 0x40, 0xe7, 0x1234, FALSE },
    { 0xe7, 0x3400, 0, FALSE },
    { 0x3400, 0x9fa6, 0x6162, FALSE },
    { 0x9fa6, 0xda9e, 0x3132, FALSE },
    { 0xdada, 0xeeee, 0x87ff, FALSE },
    { 0xeeee, 0x11111, 1, FALSE },
    { 0x11111, 0x44444, 0x6162, FALSE },
    { 0x44444, 0x60003, 0, FALSE },
    { 0xf0003, 0xf0004, 0xf, FALSE },
    { 0xf0004, 0xf0006, 0x10, FALSE },
    { 0xf0006, 0xf0007, 0x11, FALSE },
    { 0xf0007, 0xf0040, 0x12, FALSE },
    { 0xf0040, 0x110000, 0, FALSE }
};
922
/*
 * Expected contents after applying setRanges1[].
 * Fields: limit (exclusive), value. The first entry (limit 0) carries the
 * initialValue 0; there is no errorValue entry.
 */
static const CheckRange
checkRanges1[]={
    { 0, 0 },
    { 0x40, 0 },
    { 0xe7, 0x1234 },
    { 0x3400, 0 },
    { 0x9fa6, 0x6162 },
    { 0xda9e, 0x3132 },
    { 0xdada, 0 },
    { 0xeeee, 0x87ff },
    { 0x11111, 1 },
    { 0x44444, 0x6162 },
    { 0xf0003, 0 },
    { 0xf0004, 0xf },
    { 0xf0006, 0x10 },
    { 0xf0007, 0x11 },
    { 0xf0040, 0x12 },
    { 0x110000, 0 }
};
942
/*
 * set some interesting overlapping ranges
 *
 * Fields: start, limit (exclusive), value, overwrite.
 */
static const SetRange
setRanges2[]={
    { 0x21, 0x7f, 0x5555, TRUE },
    { 0x2f800, 0x2fedc, 0x7a, TRUE },
    { 0x72, 0xdd, 3, TRUE },
    { 0xdd, 0xde, 4, FALSE },
    { 0x201, 0x240, 6, TRUE }, /* 3 consecutive blocks with the same pattern but */
    { 0x241, 0x280, 6, TRUE }, /* discontiguous value ranges, testing utrie2_enum() */
    { 0x281, 0x2c0, 6, TRUE },
    { 0x2f987, 0x2fa98, 5, TRUE },
    { 0x2f777, 0x2f883, 0, TRUE },
    { 0x2f900, 0x2ffaa, 1, FALSE },
    { 0x2ffaa, 0x2ffab, 2, TRUE },
    { 0x2ffbb, 0x2ffc0, 7, TRUE }
};
959
960 static const CheckRange
961 checkRanges2[]={
962 { 0, 0 },
963 { 0x21, 0 },
964 { 0x72, 0x5555 },
965 { 0xdd, 3 },
966 { 0xde, 4 },
967 { 0x201, 0 },
968 { 0x240, 6 },
969 { 0x241, 0 },
970 { 0x280, 6 },
971 { 0x281, 0 },
972 { 0x2c0, 6 },
973 { 0x2f883, 0 },
974 { 0x2f987, 0x7a },
975 { 0x2fa98, 5 },
976 { 0x2fedc, 0x7a },
977 { 0x2ffaa, 1 },
978 { 0x2ffab, 2 },
979 { 0x2ffbb, 0 },
980 { 0x2ffc0, 7 },
981 { 0x110000, 0 }
982 };
983
984 static const CheckRange
985 checkRanges2_d800[]={
986 { 0x10000, 0 },
987 { 0x10400, 0 }
988 };
989
990 static const CheckRange
991 checkRanges2_d87e[]={
992 { 0x2f800, 6 },
993 { 0x2f883, 0 },
994 { 0x2f987, 0x7a },
995 { 0x2fa98, 5 },
996 { 0x2fc00, 0x7a }
997 };
998
999 static const CheckRange
1000 checkRanges2_d87f[]={
1001 { 0x2fc00, 0 },
1002 { 0x2fedc, 0x7a },
1003 { 0x2ffaa, 1 },
1004 { 0x2ffab, 2 },
1005 { 0x2ffbb, 0 },
1006 { 0x2ffc0, 7 },
1007 { 0x30000, 0 }
1008 };
1009
1010 static const CheckRange
1011 checkRanges2_dbff[]={
1012 { 0x10fc00, 0 },
1013 { 0x110000, 0 }
1014 };
1015
1016 /* use a non-zero initial value */
1017 static const SetRange
1018 setRanges3[]={
1019 { 0x31, 0xa4, 1, FALSE },
1020 { 0x3400, 0x6789, 2, FALSE },
1021 { 0x8000, 0x89ab, 9, TRUE },
1022 { 0x9000, 0xa000, 4, TRUE },
1023 { 0xabcd, 0xbcde, 3, TRUE },
1024 { 0x55555, 0x110000, 6, TRUE }, /* highStart<U+ffff with non-initialValue */
1025 { 0xcccc, 0x55555, 6, TRUE }
1026 };
1027
1028 static const CheckRange
1029 checkRanges3[]={
1030 { 0, 9 }, /* non-zero initialValue */
1031 { 0x31, 9 },
1032 { 0xa4, 1 },
1033 { 0x3400, 9 },
1034 { 0x6789, 2 },
1035 { 0x9000, 9 },
1036 { 0xa000, 4 },
1037 { 0xabcd, 9 },
1038 { 0xbcde, 3 },
1039 { 0xcccc, 9 },
1040 { 0x110000, 6 }
1041 };
1042
1043 /* empty or single-value tries, testing highStart==0 */
1044 static const SetRange
1045 setRangesEmpty[]={
1046 { 0, 0, 0, FALSE }, /* need some values for it to compile */
1047 };
1048
1049 static const CheckRange
1050 checkRangesEmpty[]={
1051 { 0, 3 },
1052 { 0x110000, 3 }
1053 };
1054
1055 static const SetRange
1056 setRangesSingleValue[]={
1057 { 0, 0x110000, 5, TRUE },
1058 };
1059
1060 static const CheckRange
1061 checkRangesSingleValue[]={
1062 { 0, 3 },
1063 { 0x110000, 5 }
1064 };
1065
1066 static void
TrieTest(void)1067 TrieTest(void) {
1068 testTrieRanges("set1", FALSE,
1069 setRanges1, UPRV_LENGTHOF(setRanges1),
1070 checkRanges1, UPRV_LENGTHOF(checkRanges1));
1071 testTrieRanges("set2-overlap", FALSE,
1072 setRanges2, UPRV_LENGTHOF(setRanges2),
1073 checkRanges2, UPRV_LENGTHOF(checkRanges2));
1074 testTrieRanges("set3-initial-9", FALSE,
1075 setRanges3, UPRV_LENGTHOF(setRanges3),
1076 checkRanges3, UPRV_LENGTHOF(checkRanges3));
1077 testTrieRanges("set-empty", FALSE,
1078 setRangesEmpty, 0,
1079 checkRangesEmpty, UPRV_LENGTHOF(checkRangesEmpty));
1080 testTrieRanges("set-single-value", FALSE,
1081 setRangesSingleValue, UPRV_LENGTHOF(setRangesSingleValue),
1082 checkRangesSingleValue, UPRV_LENGTHOF(checkRangesSingleValue));
1083
1084 testTrieRanges("set2-overlap.withClone", TRUE,
1085 setRanges2, UPRV_LENGTHOF(setRanges2),
1086 checkRanges2, UPRV_LENGTHOF(checkRanges2));
1087 }
1088
1089 static void
EnumNewTrieForLeadSurrogateTest(void)1090 EnumNewTrieForLeadSurrogateTest(void) {
1091 static const char *const testName="enum-for-lead";
1092 UTrie2 *trie=makeTrieWithRanges(testName, FALSE,
1093 setRanges2, UPRV_LENGTHOF(setRanges2),
1094 checkRanges2, UPRV_LENGTHOF(checkRanges2));
1095 while(trie!=NULL) {
1096 const CheckRange *checkRanges;
1097
1098 checkRanges=checkRanges2_d800+1;
1099 utrie2_enumForLeadSurrogate(trie, 0xd800,
1100 testEnumValue, testEnumRange,
1101 &checkRanges);
1102 checkRanges=checkRanges2_d87e+1;
1103 utrie2_enumForLeadSurrogate(trie, 0xd87e,
1104 testEnumValue, testEnumRange,
1105 &checkRanges);
1106 checkRanges=checkRanges2_d87f+1;
1107 utrie2_enumForLeadSurrogate(trie, 0xd87f,
1108 testEnumValue, testEnumRange,
1109 &checkRanges);
1110 checkRanges=checkRanges2_dbff+1;
1111 utrie2_enumForLeadSurrogate(trie, 0xdbff,
1112 testEnumValue, testEnumRange,
1113 &checkRanges);
1114 if(!utrie2_isFrozen(trie)) {
1115 UErrorCode errorCode=U_ZERO_ERROR;
1116 utrie2_freeze(trie, UTRIE2_16_VALUE_BITS, &errorCode);
1117 if(U_FAILURE(errorCode)) {
1118 log_err("error: utrie2_freeze(%s) failed\n", testName);
1119 utrie2_close(trie);
1120 return;
1121 }
1122 } else {
1123 utrie2_close(trie);
1124 break;
1125 }
1126 }
1127 }
1128
1129 /* test utrie2_openDummy() -------------------------------------------------- */
1130
1131 static void
dummyTest(UTrie2ValueBits valueBits)1132 dummyTest(UTrie2ValueBits valueBits) {
1133 CheckRange
1134 checkRanges[]={
1135 { -1, 0 },
1136 { 0, 0 },
1137 { 0x110000, 0 }
1138 };
1139
1140 UTrie2 *trie;
1141 UErrorCode errorCode;
1142
1143 const char *testName;
1144 uint32_t initialValue, errorValue;
1145
1146 if(valueBits==UTRIE2_16_VALUE_BITS) {
1147 testName="dummy.16";
1148 initialValue=0x313;
1149 errorValue=0xaffe;
1150 } else {
1151 testName="dummy.32";
1152 initialValue=0x01234567;
1153 errorValue=0x89abcdef;
1154 }
1155 checkRanges[0].value=errorValue;
1156 checkRanges[1].value=checkRanges[2].value=initialValue;
1157
1158 errorCode=U_ZERO_ERROR;
1159 trie=utrie2_openDummy(valueBits, initialValue, errorValue, &errorCode);
1160 if(U_FAILURE(errorCode)) {
1161 log_err("utrie2_openDummy(valueBits=%d) failed - %s\n", valueBits, u_errorName(errorCode));
1162 return;
1163 }
1164
1165 testFrozenTrie(testName, trie, valueBits, checkRanges, UPRV_LENGTHOF(checkRanges));
1166 utrie2_close(trie);
1167 }
1168
1169 static void
DummyTrieTest(void)1170 DummyTrieTest(void) {
1171 dummyTest(UTRIE2_16_VALUE_BITS);
1172 dummyTest(UTRIE2_32_VALUE_BITS);
1173 }
1174
1175 /* test builder memory management ------------------------------------------- */
1176
1177 static void
FreeBlocksTest(void)1178 FreeBlocksTest(void) {
1179 static const CheckRange
1180 checkRanges[]={
1181 { 0, 1 },
1182 { 0x740, 1 },
1183 { 0x780, 2 },
1184 { 0x880, 3 },
1185 { 0x110000, 1 }
1186 };
1187 static const char *const testName="free-blocks";
1188
1189 UTrie2 *trie;
1190 int32_t i;
1191 UErrorCode errorCode;
1192
1193 errorCode=U_ZERO_ERROR;
1194 trie=utrie2_open(1, 0xbad, &errorCode);
1195 if(U_FAILURE(errorCode)) {
1196 log_err("error: utrie2_open(%s) failed: %s\n", testName, u_errorName(errorCode));
1197 return;
1198 }
1199
1200 /*
1201 * Repeatedly set overlapping same-value ranges to stress the free-data-block management.
1202 * If it fails, it will overflow the data array.
1203 */
1204 for(i=0; i<(0x120000>>UTRIE2_SHIFT_2)/2; ++i) {
1205 utrie2_setRange32(trie, 0x740, 0x840-1, 1, TRUE, &errorCode);
1206 utrie2_setRange32(trie, 0x780, 0x880-1, 1, TRUE, &errorCode);
1207 utrie2_setRange32(trie, 0x740, 0x840-1, 2, TRUE, &errorCode);
1208 utrie2_setRange32(trie, 0x780, 0x880-1, 3, TRUE, &errorCode);
1209 }
1210 /* make blocks that will be free during compaction */
1211 utrie2_setRange32(trie, 0x1000, 0x3000-1, 2, TRUE, &errorCode);
1212 utrie2_setRange32(trie, 0x2000, 0x4000-1, 3, TRUE, &errorCode);
1213 utrie2_setRange32(trie, 0x1000, 0x4000-1, 1, TRUE, &errorCode);
1214 /* set some values for lead surrogate code units */
1215 utrie2_set32ForLeadSurrogateCodeUnit(trie, 0xd800, 90, &errorCode);
1216 utrie2_set32ForLeadSurrogateCodeUnit(trie, 0xd999, 94, &errorCode);
1217 utrie2_set32ForLeadSurrogateCodeUnit(trie, 0xdbff, 99, &errorCode);
1218 if(U_FAILURE(errorCode)) {
1219 log_err("error: setting lots of ranges into a trie (%s) failed - %s\n",
1220 testName, u_errorName(errorCode));
1221 utrie2_close(trie);
1222 return;
1223 }
1224
1225 trie=testTrieSerializeAllValueBits(testName, trie, FALSE,
1226 checkRanges, UPRV_LENGTHOF(checkRanges));
1227 utrie2_close(trie);
1228 }
1229
1230 static void
GrowDataArrayTest(void)1231 GrowDataArrayTest(void) {
1232 static const CheckRange
1233 checkRanges[]={
1234 { 0, 1 },
1235 { 0x720, 2 },
1236 { 0x7a0, 3 },
1237 { 0x8a0, 4 },
1238 { 0x110000, 5 }
1239 };
1240 static const char *const testName="grow-data";
1241
1242 UTrie2 *trie;
1243 int32_t i;
1244 UErrorCode errorCode;
1245
1246 errorCode=U_ZERO_ERROR;
1247 trie=utrie2_open(1, 0xbad, &errorCode);
1248 if(U_FAILURE(errorCode)) {
1249 log_err("error: utrie2_open(%s) failed: %s\n", testName, u_errorName(errorCode));
1250 return;
1251 }
1252
1253 /*
1254 * Use utrie2_set32() not utrie2_setRange32() to write non-initialValue-data.
1255 * Should grow/reallocate the data array to a sufficient length.
1256 */
1257 for(i=0; i<0x1000; ++i) {
1258 utrie2_set32(trie, i, 2, &errorCode);
1259 }
1260 for(i=0x720; i<0x1100; ++i) { /* some overlap */
1261 utrie2_set32(trie, i, 3, &errorCode);
1262 }
1263 for(i=0x7a0; i<0x900; ++i) {
1264 utrie2_set32(trie, i, 4, &errorCode);
1265 }
1266 for(i=0x8a0; i<0x110000; ++i) {
1267 utrie2_set32(trie, i, 5, &errorCode);
1268 }
1269 for(i=0xd800; i<0xdc00; ++i) {
1270 utrie2_set32ForLeadSurrogateCodeUnit(trie, i, 1, &errorCode);
1271 }
1272 /* set some values for lead surrogate code units */
1273 utrie2_set32ForLeadSurrogateCodeUnit(trie, 0xd800, 90, &errorCode);
1274 utrie2_set32ForLeadSurrogateCodeUnit(trie, 0xd999, 94, &errorCode);
1275 utrie2_set32ForLeadSurrogateCodeUnit(trie, 0xdbff, 99, &errorCode);
1276 if(U_FAILURE(errorCode)) {
1277 log_err("error: setting lots of values into a trie (%s) failed - %s\n",
1278 testName, u_errorName(errorCode));
1279 utrie2_close(trie);
1280 return;
1281 }
1282
1283 trie=testTrieSerializeAllValueBits(testName, trie, FALSE,
1284 checkRanges, UPRV_LENGTHOF(checkRanges));
1285 utrie2_close(trie);
1286 }
1287
1288 /* versions 1 and 2 --------------------------------------------------------- */
1289
1290 static UNewTrie *
makeNewTrie1WithRanges(const char * testName,const SetRange setRanges[],int32_t countSetRanges,const CheckRange checkRanges[],int32_t countCheckRanges)1291 makeNewTrie1WithRanges(const char *testName,
1292 const SetRange setRanges[], int32_t countSetRanges,
1293 const CheckRange checkRanges[], int32_t countCheckRanges) {
1294 UNewTrie *newTrie;
1295 uint32_t initialValue, errorValue;
1296 uint32_t value;
1297 UChar32 start, limit;
1298 int32_t i;
1299 UErrorCode errorCode;
1300 UBool overwrite, ok;
1301
1302 log_verbose("\ntesting Trie '%s'\n", testName);
1303 errorCode=U_ZERO_ERROR;
1304 getSpecialValues(checkRanges, countCheckRanges, &initialValue, &errorValue);
1305 newTrie=utrie_open(NULL, NULL, 2000,
1306 initialValue, initialValue,
1307 FALSE);
1308 if(U_FAILURE(errorCode)) {
1309 log_err("error: utrie_open(%s) failed: %s\n", testName, u_errorName(errorCode));
1310 return NULL;
1311 }
1312
1313 /* set values from setRanges[] */
1314 ok=TRUE;
1315 for(i=0; i<countSetRanges; ++i) {
1316 start=setRanges[i].start;
1317 limit=setRanges[i].limit;
1318 value=setRanges[i].value;
1319 overwrite=setRanges[i].overwrite;
1320 if((limit-start)==1 && overwrite) {
1321 ok&=utrie_set32(newTrie, start, value);
1322 } else {
1323 ok&=utrie_setRange32(newTrie, start, limit, value, overwrite);
1324 }
1325 }
1326 if(ok) {
1327 return newTrie;
1328 } else {
1329 log_err("error: setting values into a trie1 (%s) failed\n", testName);
1330 utrie_close(newTrie);
1331 return NULL;
1332 }
1333 }
1334
1335 static void
testTrie2FromTrie1(const char * testName,const SetRange setRanges[],int32_t countSetRanges,const CheckRange checkRanges[],int32_t countCheckRanges)1336 testTrie2FromTrie1(const char *testName,
1337 const SetRange setRanges[], int32_t countSetRanges,
1338 const CheckRange checkRanges[], int32_t countCheckRanges) {
1339 uint32_t memory1_16[3000], memory1_32[3000];
1340 int32_t length16, length32;
1341 UChar lead;
1342
1343 char name[40];
1344
1345 UNewTrie *newTrie1_16, *newTrie1_32;
1346 UTrie trie1_16, trie1_32;
1347 UTrie2 *trie2;
1348 uint32_t initialValue, errorValue;
1349 UErrorCode errorCode;
1350
1351 newTrie1_16=makeNewTrie1WithRanges(testName,
1352 setRanges, countSetRanges,
1353 checkRanges, countCheckRanges);
1354 if(newTrie1_16==NULL) {
1355 return;
1356 }
1357 newTrie1_32=utrie_clone(NULL, newTrie1_16, NULL, 0);
1358 if(newTrie1_32==NULL) {
1359 utrie_close(newTrie1_16);
1360 return;
1361 }
1362 errorCode=U_ZERO_ERROR;
1363 length16=utrie_serialize(newTrie1_16, memory1_16, sizeof(memory1_16),
1364 NULL, TRUE, &errorCode);
1365 length32=utrie_serialize(newTrie1_32, memory1_32, sizeof(memory1_32),
1366 NULL, FALSE, &errorCode);
1367 utrie_unserialize(&trie1_16, memory1_16, length16, &errorCode);
1368 utrie_unserialize(&trie1_32, memory1_32, length32, &errorCode);
1369 utrie_close(newTrie1_16);
1370 utrie_close(newTrie1_32);
1371 if(U_FAILURE(errorCode)) {
1372 log_err("error: utrie_serialize or unserialize(%s) failed: %s\n",
1373 testName, u_errorName(errorCode));
1374 return;
1375 }
1376
1377 getSpecialValues(checkRanges, countCheckRanges, &initialValue, &errorValue);
1378
1379 uprv_strcpy(name, testName);
1380 uprv_strcat(name, ".16");
1381 trie2=utrie2_fromUTrie(&trie1_16, errorValue, &errorCode);
1382 if(U_SUCCESS(errorCode)) {
1383 testFrozenTrie(name, trie2, UTRIE2_16_VALUE_BITS, checkRanges, countCheckRanges);
1384 for(lead=0xd800; lead<0xdc00; ++lead) {
1385 uint32_t value1, value2;
1386 value1=UTRIE_GET16_FROM_LEAD(&trie1_16, lead);
1387 value2=UTRIE2_GET16_FROM_U16_SINGLE_LEAD(trie2, lead);
1388 if(value1!=value2) {
1389 log_err("error: utrie2_fromUTrie(%s) wrong value %ld!=%ld "
1390 "from lead surrogate code unit U+%04lx\n",
1391 name, (long)value2, (long)value1, (long)lead);
1392 break;
1393 }
1394 }
1395 }
1396 utrie2_close(trie2);
1397
1398 uprv_strcpy(name, testName);
1399 uprv_strcat(name, ".32");
1400 trie2=utrie2_fromUTrie(&trie1_32, errorValue, &errorCode);
1401 if(U_SUCCESS(errorCode)) {
1402 testFrozenTrie(name, trie2, UTRIE2_32_VALUE_BITS, checkRanges, countCheckRanges);
1403 for(lead=0xd800; lead<0xdc00; ++lead) {
1404 uint32_t value1, value2;
1405 value1=UTRIE_GET32_FROM_LEAD(&trie1_32, lead);
1406 value2=UTRIE2_GET32_FROM_U16_SINGLE_LEAD(trie2, lead);
1407 if(value1!=value2) {
1408 log_err("error: utrie2_fromUTrie(%s) wrong value %ld!=%ld "
1409 "from lead surrogate code unit U+%04lx\n",
1410 name, (long)value2, (long)value1, (long)lead);
1411 break;
1412 }
1413 }
1414 }
1415 utrie2_close(trie2);
1416 }
1417
1418 static void
Trie12ConversionTest(void)1419 Trie12ConversionTest(void) {
1420 testTrie2FromTrie1("trie1->trie2",
1421 setRanges2, UPRV_LENGTHOF(setRanges2),
1422 checkRanges2, UPRV_LENGTHOF(checkRanges2));
1423 }
1424
1425 void
addTrie2Test(TestNode ** root)1426 addTrie2Test(TestNode** root) {
1427 addTest(root, &TrieTest, "tsutil/trie2test/TrieTest");
1428 addTest(root, &EnumNewTrieForLeadSurrogateTest,
1429 "tsutil/trie2test/EnumNewTrieForLeadSurrogateTest");
1430 addTest(root, &DummyTrieTest, "tsutil/trie2test/DummyTrieTest");
1431 addTest(root, &FreeBlocksTest, "tsutil/trie2test/FreeBlocksTest");
1432 addTest(root, &GrowDataArrayTest, "tsutil/trie2test/GrowDataArrayTest");
1433 addTest(root, &Trie12ConversionTest, "tsutil/trie2test/Trie12ConversionTest");
1434 }
1435