• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1 /********************************************************************
2  * Copyright (c) 1999-2012, International Business Machines
3  * Corporation and others. All Rights Reserved.
4  ********************************************************************
5  *   Date        Name        Description
6  *   12/14/99    Madhu        Creation.
7  *   01/12/2000  Madhu        updated for changed API
8  ********************************************************************/
9 
10 #include "unicode/utypes.h"
11 
12 #if !UCONFIG_NO_BREAK_ITERATION
13 
14 #include "unicode/uchar.h"
15 #include "intltest.h"
16 #include "unicode/rbbi.h"
17 #include "unicode/schriter.h"
18 #include "rbbiapts.h"
19 #include "rbbidata.h"
20 #include "cstring.h"
21 #include "ubrkimpl.h"
22 #include "unicode/locid.h"
23 #include "unicode/ustring.h"
24 #include "unicode/utext.h"
25 #include "cmemory.h"
26 
27 /**
28  * API Test the RuleBasedBreakIterator class
29  */
30 
31 
32 #define TEST_ASSERT_SUCCESS(status) {if (U_FAILURE(status)) {\
33 dataerrln("Failure at file %s, line %d, error = %s", __FILE__, __LINE__, u_errorName(status));}}
34 
35 #define TEST_ASSERT(expr) {if ((expr) == FALSE) { \
36     errln("Test Failure at file %s, line %d: \"%s\" is false.\n", __FILE__, __LINE__, #expr);};}
37 
TestCloneEquals()38 void RBBIAPITest::TestCloneEquals()
39 {
40 
41     UErrorCode status=U_ZERO_ERROR;
42     RuleBasedBreakIterator* bi1     = (RuleBasedBreakIterator*)RuleBasedBreakIterator::createCharacterInstance(Locale::getDefault(), status);
43     RuleBasedBreakIterator* biequal = (RuleBasedBreakIterator*)RuleBasedBreakIterator::createCharacterInstance(Locale::getDefault(), status);
44     RuleBasedBreakIterator* bi3     = (RuleBasedBreakIterator*)RuleBasedBreakIterator::createCharacterInstance(Locale::getDefault(), status);
45     RuleBasedBreakIterator* bi2     = (RuleBasedBreakIterator*)RuleBasedBreakIterator::createWordInstance(Locale::getDefault(), status);
46     if(U_FAILURE(status)){
47         errcheckln(status, "Fail : in construction - %s", u_errorName(status));
48         return;
49     }
50 
51 
52     UnicodeString testString="Testing word break iterators's clone() and equals()";
53     bi1->setText(testString);
54     bi2->setText(testString);
55     biequal->setText(testString);
56 
57     bi3->setText("hello");
58 
59     logln((UnicodeString)"Testing equals()");
60 
61     logln((UnicodeString)"Testing == and !=");
62     UBool b = (*bi1 != *biequal);
63     b |= *bi1 == *bi2;
64     b |= *bi1 == *bi3;
65     if (b) {
66         errln((UnicodeString)"ERROR:1 RBBI's == and != operator failed.");
67     }
68 
69     if(*bi2 == *biequal || *bi2 == *bi1  || *biequal == *bi3)
70         errln((UnicodeString)"ERROR:2 RBBI's == and != operator  failed.");
71 
72 
73     // Quick test of RulesBasedBreakIterator assignment -
74     // Check that
75     //    two different iterators are !=
76     //    they are == after assignment
77     //    source and dest iterator produce the same next() after assignment.
78     //    deleting one doesn't disable the other.
79     logln("Testing assignment");
80     RuleBasedBreakIterator *bix = (RuleBasedBreakIterator *)BreakIterator::createLineInstance(Locale::getDefault(), status);
81     if(U_FAILURE(status)){
82         errcheckln(status, "Fail : in construction - %s", u_errorName(status));
83         return;
84     }
85 
86     RuleBasedBreakIterator biDefault, biDefault2;
87     if(U_FAILURE(status)){
88         errln((UnicodeString)"FAIL : in construction of default iterator");
89         return;
90     }
91     if (biDefault == *bix) {
92         errln((UnicodeString)"ERROR: iterators should not compare ==");
93         return;
94     }
95     if (biDefault != biDefault2) {
96         errln((UnicodeString)"ERROR: iterators should compare ==");
97         return;
98     }
99 
100 
101     UnicodeString   HelloString("Hello Kitty");
102     bix->setText(HelloString);
103     if (*bix == *bi2) {
104         errln(UnicodeString("ERROR: strings should not be equal before assignment."));
105     }
106     *bix = *bi2;
107     if (*bix != *bi2) {
108         errln(UnicodeString("ERROR: strings should be equal before assignment."));
109     }
110 
111     int bixnext = bix->next();
112     int bi2next = bi2->next();
113     if (! (bixnext == bi2next && bixnext == 7)) {
114         errln(UnicodeString("ERROR: iterators behaved differently after assignment."));
115     }
116     delete bix;
117     if (bi2->next() != 8) {
118         errln(UnicodeString("ERROR: iterator.next() failed after deleting copy."));
119     }
120 
121 
122 
123     logln((UnicodeString)"Testing clone()");
124     RuleBasedBreakIterator* bi1clone=(RuleBasedBreakIterator*)bi1->clone();
125     RuleBasedBreakIterator* bi2clone=(RuleBasedBreakIterator*)bi2->clone();
126 
127     if(*bi1clone != *bi1 || *bi1clone  != *biequal  ||
128       *bi1clone == *bi3 || *bi1clone == *bi2)
129         errln((UnicodeString)"ERROR:1 RBBI's clone() method failed");
130 
131     if(*bi2clone == *bi1 || *bi2clone == *biequal ||
132        *bi2clone == *bi3 || *bi2clone != *bi2)
133         errln((UnicodeString)"ERROR:2 RBBI's clone() method failed");
134 
135     if(bi1->getText() != bi1clone->getText()   ||
136        bi2clone->getText() != bi2->getText()   ||
137        *bi2clone == *bi1clone )
138         errln((UnicodeString)"ERROR: RBBI's clone() method failed");
139 
140     delete bi1clone;
141     delete bi2clone;
142     delete bi1;
143     delete bi3;
144     delete bi2;
145     delete biequal;
146 }
147 
TestBoilerPlate()148 void RBBIAPITest::TestBoilerPlate()
149 {
150     UErrorCode status = U_ZERO_ERROR;
151     BreakIterator* a = BreakIterator::createWordInstance(Locale("hi"), status);
152     BreakIterator* b = BreakIterator::createWordInstance(Locale("hi_IN"),status);
153     if (U_FAILURE(status)) {
154         errcheckln(status, "Creation of break iterator failed %s", u_errorName(status));
155         return;
156     }
157     if(*a!=*b){
158         errln("Failed: boilerplate method operator!= does not return correct results");
159     }
160     // Japanese word break iterators are identical to root with
161     // a dictionary-based break iterator
162     BreakIterator* c = BreakIterator::createCharacterInstance(Locale("ja"),status);
163     BreakIterator* d = BreakIterator::createCharacterInstance(Locale("root"),status);
164     if(c && d){
165         if(*c!=*d){
166             errln("Failed: boilerplate method operator== does not return correct results");
167         }
168     }else{
169         errln("creation of break iterator failed");
170     }
171     delete a;
172     delete b;
173     delete c;
174     delete d;
175 }
176 
TestgetRules()177 void RBBIAPITest::TestgetRules()
178 {
179     UErrorCode status=U_ZERO_ERROR;
180 
181     RuleBasedBreakIterator* bi1=(RuleBasedBreakIterator*)RuleBasedBreakIterator::createCharacterInstance(Locale::getDefault(), status);
182     RuleBasedBreakIterator* bi2=(RuleBasedBreakIterator*)RuleBasedBreakIterator::createWordInstance(Locale::getDefault(), status);
183     if(U_FAILURE(status)){
184         errcheckln(status, "FAIL: in construction - %s", u_errorName(status));
185         delete bi1;
186         delete bi2;
187         return;
188     }
189 
190 
191 
192     logln((UnicodeString)"Testing toString()");
193 
194     bi1->setText((UnicodeString)"Hello there");
195 
196     RuleBasedBreakIterator* bi3 =(RuleBasedBreakIterator*)bi1->clone();
197 
198     UnicodeString temp=bi1->getRules();
199     UnicodeString temp2=bi2->getRules();
200     UnicodeString temp3=bi3->getRules();
201     if( temp2.compare(temp3) ==0 || temp.compare(temp2) == 0 || temp.compare(temp3) != 0)
202         errln((UnicodeString)"ERROR: error in getRules() method");
203 
204     delete bi1;
205     delete bi2;
206     delete bi3;
207 }
TestHashCode()208 void RBBIAPITest::TestHashCode()
209 {
210     UErrorCode status=U_ZERO_ERROR;
211     RuleBasedBreakIterator* bi1     = (RuleBasedBreakIterator*)RuleBasedBreakIterator::createCharacterInstance(Locale::getDefault(), status);
212     RuleBasedBreakIterator* bi3     = (RuleBasedBreakIterator*)RuleBasedBreakIterator::createCharacterInstance(Locale::getDefault(), status);
213     RuleBasedBreakIterator* bi2     = (RuleBasedBreakIterator*)RuleBasedBreakIterator::createWordInstance(Locale::getDefault(), status);
214     if(U_FAILURE(status)){
215         errcheckln(status, "Fail : in construction - %s", u_errorName(status));
216         delete bi1;
217         delete bi2;
218         delete bi3;
219         return;
220     }
221 
222 
223     logln((UnicodeString)"Testing hashCode()");
224 
225     bi1->setText((UnicodeString)"Hash code");
226     bi2->setText((UnicodeString)"Hash code");
227     bi3->setText((UnicodeString)"Hash code");
228 
229     RuleBasedBreakIterator* bi1clone= (RuleBasedBreakIterator*)bi1->clone();
230     RuleBasedBreakIterator* bi2clone= (RuleBasedBreakIterator*)bi2->clone();
231 
232     if(bi1->hashCode() != bi1clone->hashCode() ||  bi1->hashCode() != bi3->hashCode() ||
233         bi1clone->hashCode() != bi3->hashCode() || bi2->hashCode() != bi2clone->hashCode())
234         errln((UnicodeString)"ERROR: identical objects have different hashcodes");
235 
236     if(bi1->hashCode() == bi2->hashCode() ||  bi2->hashCode() == bi3->hashCode() ||
237         bi1clone->hashCode() == bi2clone->hashCode() || bi1clone->hashCode() == bi2->hashCode())
238         errln((UnicodeString)"ERROR: different objects have same hashcodes");
239 
240     delete bi1clone;
241     delete bi2clone;
242     delete bi1;
243     delete bi2;
244     delete bi3;
245 
246 }
TestGetSetAdoptText()247 void RBBIAPITest::TestGetSetAdoptText()
248 {
249     logln((UnicodeString)"Testing getText setText ");
250     IcuTestErrorCode status(*this, "TestGetSetAdoptText");
251     UnicodeString str1="first string.";
252     UnicodeString str2="Second string.";
253     LocalPointer<RuleBasedBreakIterator> charIter1((RuleBasedBreakIterator*)RuleBasedBreakIterator::createCharacterInstance(Locale::getDefault(), status));
254     LocalPointer<RuleBasedBreakIterator> wordIter1((RuleBasedBreakIterator*)RuleBasedBreakIterator::createWordInstance(Locale::getDefault(), status));
255     if(status.isFailure()){
256         errcheckln(status, "Fail : in construction - %s", status.errorName());
257             return;
258     }
259 
260 
261     CharacterIterator* text1= new StringCharacterIterator(str1);
262     CharacterIterator* text1Clone = text1->clone();
263     CharacterIterator* text2= new StringCharacterIterator(str2);
264     CharacterIterator* text3= new StringCharacterIterator(str2, 3, 10, 3); //  "ond str"
265 
266     wordIter1->setText(str1);
267     CharacterIterator *tci = &wordIter1->getText();
268     UnicodeString      tstr;
269     tci->getText(tstr);
270     TEST_ASSERT(tstr == str1);
271     if(wordIter1->current() != 0)
272         errln((UnicodeString)"ERROR:1 setText did not set the iteration position to the beginning of the text, it is" + wordIter1->current() + (UnicodeString)"\n");
273 
274     wordIter1->next(2);
275 
276     wordIter1->setText(str2);
277     if(wordIter1->current() != 0)
278         errln((UnicodeString)"ERROR:2 setText did not reset the iteration position to the beginning of the text, it is" + wordIter1->current() + (UnicodeString)"\n");
279 
280 
281     charIter1->adoptText(text1Clone);
282     TEST_ASSERT(wordIter1->getText() != charIter1->getText());
283     tci = &wordIter1->getText();
284     tci->getText(tstr);
285     TEST_ASSERT(tstr == str2);
286     tci = &charIter1->getText();
287     tci->getText(tstr);
288     TEST_ASSERT(tstr == str1);
289 
290 
291     LocalPointer<RuleBasedBreakIterator> rb((RuleBasedBreakIterator*)wordIter1->clone());
292     rb->adoptText(text1);
293     if(rb->getText() != *text1)
294         errln((UnicodeString)"ERROR:1 error in adoptText ");
295     rb->adoptText(text2);
296     if(rb->getText() != *text2)
297         errln((UnicodeString)"ERROR:2 error in adoptText ");
298 
299     // Adopt where iterator range is less than the entire orignal source string.
300     //   (With the change of the break engine to working with UText internally,
301     //    CharacterIterators starting at positions other than zero are not supported)
302     rb->adoptText(text3);
303     TEST_ASSERT(rb->preceding(2) == 0);
304     TEST_ASSERT(rb->following(11) == BreakIterator::DONE);
305     //if(rb->preceding(2) != 3) {
306     //    errln((UnicodeString)"ERROR:3 error in adoptText ");
307     //}
308     //if(rb->following(11) != BreakIterator::DONE) {
309     //    errln((UnicodeString)"ERROR:4 error in adoptText ");
310     //}
311 
312     // UText API
313     //
314     //   Quick test to see if UText is working at all.
315     //
316     const char *s1 = "\x68\x65\x6C\x6C\x6F\x20\x77\x6F\x72\x6C\x64"; /* "hello world" in UTF-8 */
317     const char *s2 = "\x73\x65\x65\x20\x79\x61"; /* "see ya" in UTF-8 */
318     //                012345678901
319 
320     status.reset();
321     LocalUTextPointer ut(utext_openUTF8(NULL, s1, -1, status));
322     wordIter1->setText(ut.getAlias(), status);
323     TEST_ASSERT_SUCCESS(status);
324 
325     int32_t pos;
326     pos = wordIter1->first();
327     TEST_ASSERT(pos==0);
328     pos = wordIter1->next();
329     TEST_ASSERT(pos==5);
330     pos = wordIter1->next();
331     TEST_ASSERT(pos==6);
332     pos = wordIter1->next();
333     TEST_ASSERT(pos==11);
334     pos = wordIter1->next();
335     TEST_ASSERT(pos==UBRK_DONE);
336 
337     status.reset();
338     LocalUTextPointer ut2(utext_openUTF8(NULL, s2, -1, status));
339     TEST_ASSERT_SUCCESS(status);
340     wordIter1->setText(ut2.getAlias(), status);
341     TEST_ASSERT_SUCCESS(status);
342 
343     pos = wordIter1->first();
344     TEST_ASSERT(pos==0);
345     pos = wordIter1->next();
346     TEST_ASSERT(pos==3);
347     pos = wordIter1->next();
348     TEST_ASSERT(pos==4);
349 
350     pos = wordIter1->last();
351     TEST_ASSERT(pos==6);
352     pos = wordIter1->previous();
353     TEST_ASSERT(pos==4);
354     pos = wordIter1->previous();
355     TEST_ASSERT(pos==3);
356     pos = wordIter1->previous();
357     TEST_ASSERT(pos==0);
358     pos = wordIter1->previous();
359     TEST_ASSERT(pos==UBRK_DONE);
360 
361     status.reset();
362     UnicodeString sEmpty;
363     LocalUTextPointer gut2(utext_openUnicodeString(NULL, &sEmpty, status));
364     wordIter1->getUText(gut2.getAlias(), status);
365     TEST_ASSERT_SUCCESS(status);
366     status.reset();
367 }
368 
369 
TestIteration()370 void RBBIAPITest::TestIteration()
371 {
372     // This test just verifies that the API is present.
373     // Testing for correct operation of the break rules happens elsewhere.
374 
375     UErrorCode status=U_ZERO_ERROR;
376     RuleBasedBreakIterator* bi  = (RuleBasedBreakIterator*)RuleBasedBreakIterator::createCharacterInstance(Locale::getDefault(), status);
377     if (U_FAILURE(status) || bi == NULL)  {
378         errcheckln(status, "Failure creating character break iterator.  Status = %s", u_errorName(status));
379     }
380     delete bi;
381 
382     status=U_ZERO_ERROR;
383     bi  = (RuleBasedBreakIterator*)RuleBasedBreakIterator::createWordInstance(Locale::getDefault(), status);
384     if (U_FAILURE(status) || bi == NULL)  {
385         errcheckln(status, "Failure creating Word break iterator.  Status = %s", u_errorName(status));
386     }
387     delete bi;
388 
389     status=U_ZERO_ERROR;
390     bi  = (RuleBasedBreakIterator*)RuleBasedBreakIterator::createLineInstance(Locale::getDefault(), status);
391     if (U_FAILURE(status) || bi == NULL)  {
392         errcheckln(status, "Failure creating Line break iterator.  Status = %s", u_errorName(status));
393     }
394     delete bi;
395 
396     status=U_ZERO_ERROR;
397     bi  = (RuleBasedBreakIterator*)RuleBasedBreakIterator::createSentenceInstance(Locale::getDefault(), status);
398     if (U_FAILURE(status) || bi == NULL)  {
399         errcheckln(status, "Failure creating Sentence break iterator.  Status = %s", u_errorName(status));
400     }
401     delete bi;
402 
403     status=U_ZERO_ERROR;
404     bi  = (RuleBasedBreakIterator*)RuleBasedBreakIterator::createTitleInstance(Locale::getDefault(), status);
405     if (U_FAILURE(status) || bi == NULL)  {
406         errcheckln(status, "Failure creating Title break iterator.  Status = %s", u_errorName(status));
407     }
408     delete bi;
409 
410     status=U_ZERO_ERROR;
411     bi  = (RuleBasedBreakIterator*)RuleBasedBreakIterator::createCharacterInstance(Locale::getDefault(), status);
412     if (U_FAILURE(status) || bi == NULL)  {
413         errcheckln(status, "Failure creating character break iterator.  Status = %s", u_errorName(status));
414         return;   // Skip the rest of these tests.
415     }
416 
417 
418     UnicodeString testString="0123456789";
419     bi->setText(testString);
420 
421     int32_t i;
422     i = bi->first();
423     if (i != 0) {
424         errln("Incorrect value from bi->first().  Expected 0, got %d.", i);
425     }
426 
427     i = bi->last();
428     if (i != 10) {
429         errln("Incorrect value from bi->last().  Expected 10, got %d", i);
430     }
431 
432     //
433     // Previous
434     //
435     bi->last();
436     i = bi->previous();
437     if (i != 9) {
438         errln("Incorrect value from bi->last() at line %d.  Expected 9, got %d", __LINE__, i);
439     }
440 
441 
442     bi->first();
443     i = bi->previous();
444     if (i != BreakIterator::DONE) {
445         errln("Incorrect value from bi->previous() at line %d.  Expected DONE, got %d", __LINE__, i);
446     }
447 
448     //
449     // next()
450     //
451     bi->first();
452     i = bi->next();
453     if (i != 1) {
454         errln("Incorrect value from bi->next() at line %d.  Expected 1, got %d", __LINE__, i);
455     }
456 
457     bi->last();
458     i = bi->next();
459     if (i != BreakIterator::DONE) {
460         errln("Incorrect value from bi->next() at line %d.  Expected DONE, got %d", __LINE__, i);
461     }
462 
463 
464     //
465     //  current()
466     //
467     bi->first();
468     i = bi->current();
469     if (i != 0) {
470         errln("Incorrect value from bi->previous() at line %d.  Expected 0, got %d", __LINE__, i);
471     }
472 
473     bi->next();
474     i = bi->current();
475     if (i != 1) {
476         errln("Incorrect value from bi->previous() at line %d.  Expected 1, got %d", __LINE__, i);
477     }
478 
479     bi->last();
480     bi->next();
481     i = bi->current();
482     if (i != 10) {
483         errln("Incorrect value from bi->previous() at line %d.  Expected 10, got %d", __LINE__, i);
484     }
485 
486     bi->first();
487     bi->previous();
488     i = bi->current();
489     if (i != 0) {
490         errln("Incorrect value from bi->previous() at line %d.  Expected 0, got %d", __LINE__, i);
491     }
492 
493 
494     //
495     // Following()
496     //
497     i = bi->following(4);
498     if (i != 5) {
499         errln("Incorrect value from bi->following() at line %d.  Expected 5, got %d", __LINE__, i);
500     }
501 
502     i = bi->following(9);
503     if (i != 10) {
504         errln("Incorrect value from bi->following() at line %d.  Expected 10, got %d", __LINE__, i);
505     }
506 
507     i = bi->following(10);
508     if (i != BreakIterator::DONE) {
509         errln("Incorrect value from bi->following() at line %d.  Expected DONE, got %d", __LINE__, i);
510     }
511 
512 
513     //
514     // Preceding
515     //
516     i = bi->preceding(4);
517     if (i != 3) {
518         errln("Incorrect value from bi->preceding() at line %d.  Expected 3, got %d", __LINE__, i);
519     }
520 
521     i = bi->preceding(10);
522     if (i != 9) {
523         errln("Incorrect value from bi->preceding() at line %d.  Expected 9, got %d", __LINE__, i);
524     }
525 
526     i = bi->preceding(1);
527     if (i != 0) {
528         errln("Incorrect value from bi->preceding() at line %d.  Expected 0, got %d", __LINE__, i);
529     }
530 
531     i = bi->preceding(0);
532     if (i != BreakIterator::DONE) {
533         errln("Incorrect value from bi->preceding() at line %d.  Expected DONE, got %d", __LINE__, i);
534     }
535 
536 
537     //
538     // isBoundary()
539     //
540     bi->first();
541     if (bi->isBoundary(3) != TRUE) {
542         errln("Incorrect value from bi->isBoudary() at line %d.  Expected TRUE, got FALSE", __LINE__, i);
543     }
544     i = bi->current();
545     if (i != 3) {
546         errln("Incorrect value from bi->current() at line %d.  Expected 3, got %d", __LINE__, i);
547     }
548 
549 
550     if (bi->isBoundary(11) != FALSE) {
551         errln("Incorrect value from bi->isBoudary() at line %d.  Expected FALSE, got TRUE", __LINE__, i);
552     }
553     i = bi->current();
554     if (i != 10) {
555         errln("Incorrect value from bi->current() at line %d.  Expected 10, got %d", __LINE__, i);
556     }
557 
558     //
559     // next(n)
560     //
561     bi->first();
562     i = bi->next(4);
563     if (i != 4) {
564         errln("Incorrect value from bi->next() at line %d.  Expected 4, got %d", __LINE__, i);
565     }
566 
567     i = bi->next(6);
568     if (i != 10) {
569         errln("Incorrect value from bi->next() at line %d.  Expected 10, got %d", __LINE__, i);
570     }
571 
572     bi->first();
573     i = bi->next(11);
574     if (i != BreakIterator::DONE) {
575         errln("Incorrect value from bi->next() at line %d.  Expected BreakIterator::DONE, got %d", __LINE__, i);
576     }
577 
578     delete bi;
579 
580 }
581 
582 
583 
584 
585 
586 
TestBuilder()587 void RBBIAPITest::TestBuilder() {
588      UnicodeString rulesString1 = "$Letters = [:L:];\n"
589                                   "$Numbers = [:N:];\n"
590                                   "$Letters+;\n"
591                                   "$Numbers+;\n"
592                                   "[^$Letters $Numbers];\n"
593                                   "!.*;\n";
594      UnicodeString testString1  = "abc123..abc";
595                                 // 01234567890
596      int32_t bounds1[] = {0, 3, 6, 7, 8, 11};
597      UErrorCode status=U_ZERO_ERROR;
598      UParseError    parseError;
599 
600      RuleBasedBreakIterator *bi = new RuleBasedBreakIterator(rulesString1, parseError, status);
601      if(U_FAILURE(status)) {
602          dataerrln("Fail : in construction - %s", u_errorName(status));
603      } else {
604          bi->setText(testString1);
605          doBoundaryTest(*bi, testString1, bounds1);
606      }
607      delete bi;
608 }
609 
610 
611 //
612 //  TestQuoteGrouping
613 //       Single quotes within rules imply a grouping, so that a modifier
614 //       following the quoted text (* or +) applies to all of the quoted chars.
615 //
TestQuoteGrouping()616 void RBBIAPITest::TestQuoteGrouping() {
617      UnicodeString rulesString1 = "#Here comes the rule...\n"
618                                   "'$@!'*;\n"   //  (\$\@\!)*
619                                   ".;\n";
620 
621      UnicodeString testString1  = "$@!$@!X$@!!X";
622                                 // 0123456789012
623      int32_t bounds1[] = {0, 6, 7, 10, 11, 12};
624      UErrorCode status=U_ZERO_ERROR;
625      UParseError    parseError;
626 
627      RuleBasedBreakIterator *bi = new RuleBasedBreakIterator(rulesString1, parseError, status);
628      if(U_FAILURE(status)) {
629          dataerrln("Fail : in construction - %s", u_errorName(status));
630      } else {
631          bi->setText(testString1);
632          doBoundaryTest(*bi, testString1, bounds1);
633      }
634      delete bi;
635 }
636 
637 //
638 //  TestRuleStatus
639 //      Test word break rule status constants.
640 //
TestRuleStatus()641 void RBBIAPITest::TestRuleStatus() {
642      UChar str[30];
643      //no longer test Han or hiragana breaking here: ruleStatusVec would return nothing
644      // changed UBRK_WORD_KANA to UBRK_WORD_IDEO
645      u_unescape("plain word 123.45 \\u30a1\\u30a2 ",
646               // 012345678901234567  8      9    0
647               //                     Katakana
648                 str, 30);
649      UnicodeString testString1(str);
650      int32_t bounds1[] = {0, 5, 6, 10, 11, 17, 18, 20, 21};
651      int32_t tag_lo[]  = {UBRK_WORD_NONE,     UBRK_WORD_LETTER, UBRK_WORD_NONE,    UBRK_WORD_LETTER,
652                           UBRK_WORD_NONE,     UBRK_WORD_NUMBER, UBRK_WORD_NONE,
653                           UBRK_WORD_IDEO,     UBRK_WORD_NONE};
654 
655      int32_t tag_hi[]  = {UBRK_WORD_NONE_LIMIT, UBRK_WORD_LETTER_LIMIT, UBRK_WORD_NONE_LIMIT, UBRK_WORD_LETTER_LIMIT,
656                           UBRK_WORD_NONE_LIMIT, UBRK_WORD_NUMBER_LIMIT, UBRK_WORD_NONE_LIMIT,
657                           UBRK_WORD_IDEO_LIMIT, UBRK_WORD_NONE_LIMIT};
658 
659      UErrorCode status=U_ZERO_ERROR;
660 
661      RuleBasedBreakIterator *bi = (RuleBasedBreakIterator *)BreakIterator::createWordInstance(Locale::getEnglish(), status);
662      if(U_FAILURE(status)) {
663          errcheckln(status, "Fail : in construction - %s", u_errorName(status));
664      } else {
665          bi->setText(testString1);
666          // First test that the breaks are in the right spots.
667          doBoundaryTest(*bi, testString1, bounds1);
668 
669          // Then go back and check tag values
670          int32_t i = 0;
671          int32_t pos, tag;
672          for (pos = bi->first(); pos != BreakIterator::DONE; pos = bi->next(), i++) {
673              if (pos != bounds1[i]) {
674                  errln("FAIL: unexpected word break at postion %d", pos);
675                  break;
676              }
677              tag = bi->getRuleStatus();
678              if (tag < tag_lo[i] || tag >= tag_hi[i]) {
679                  errln("FAIL: incorrect tag value %d at position %d", tag, pos);
680                  break;
681              }
682 
683              // Check that we get the same tag values from getRuleStatusVec()
684              int32_t vec[10];
685              int t = bi->getRuleStatusVec(vec, 10, status);
686              TEST_ASSERT_SUCCESS(status);
687              TEST_ASSERT(t==1);
688              TEST_ASSERT(vec[0] == tag);
689          }
690      }
691      delete bi;
692 
693      // Now test line break status.  This test mostly is to confirm that the status constants
694      //                              are correctly declared in the header.
695      testString1 =   "test line. \n";
696      // break type    s    s     h
697 
698      bi = (RuleBasedBreakIterator *)
699          BreakIterator::createLineInstance(Locale::getEnglish(), status);
700      if(U_FAILURE(status)) {
701          errcheckln(status, "failed to create word break iterator. - %s", u_errorName(status));
702      } else {
703          int32_t i = 0;
704          int32_t pos, tag;
705          UBool   success;
706 
707          bi->setText(testString1);
708          pos = bi->current();
709          tag = bi->getRuleStatus();
710          for (i=0; i<3; i++) {
711              switch (i) {
712              case 0:
713                  success = pos==0  && tag==UBRK_LINE_SOFT; break;
714              case 1:
715                  success = pos==5  && tag==UBRK_LINE_SOFT; break;
716              case 2:
717                  success = pos==12 && tag==UBRK_LINE_HARD; break;
718              default:
719                  success = FALSE; break;
720              }
721              if (success == FALSE) {
722                  errln("Fail: incorrect word break status or position.  i=%d, pos=%d, tag=%d",
723                      i, pos, tag);
724                  break;
725              }
726              pos = bi->next();
727              tag = bi->getRuleStatus();
728          }
729          if (UBRK_LINE_SOFT >= UBRK_LINE_SOFT_LIMIT ||
730              UBRK_LINE_HARD >= UBRK_LINE_HARD_LIMIT ||
731              (UBRK_LINE_HARD > UBRK_LINE_SOFT && UBRK_LINE_HARD < UBRK_LINE_SOFT_LIMIT)) {
732              errln("UBRK_LINE_* constants from header are inconsistent.");
733          }
734      }
735      delete bi;
736 
737 }
738 
739 
740 //
741 //  TestRuleStatusVec
742 //      Test the vector form of  break rule status.
743 //
TestRuleStatusVec()744 void RBBIAPITest::TestRuleStatusVec() {
745     UnicodeString rulesString(   "[A-N]{100}; \n"
746                                  "[a-w]{200}; \n"
747                                  "[\\p{L}]{300}; \n"
748                                  "[\\p{N}]{400}; \n"
749                                  "[0-5]{500}; \n"
750                                   "!.*;\n", -1, US_INV);
751      UnicodeString testString1  = "Aapz5?";
752      int32_t  statusVals[10];
753      int32_t  numStatuses;
754      int32_t  pos;
755 
756      UErrorCode status=U_ZERO_ERROR;
757      UParseError    parseError;
758 
759      RuleBasedBreakIterator *bi = new RuleBasedBreakIterator(rulesString, parseError, status);
760      if (U_FAILURE(status)) {
761          dataerrln("Failure at file %s, line %d, error = %s", __FILE__, __LINE__, u_errorName(status));
762      } else {
763          bi->setText(testString1);
764 
765          // A
766          pos = bi->next();
767          TEST_ASSERT(pos==1);
768          numStatuses = bi->getRuleStatusVec(statusVals, 10, status);
769          TEST_ASSERT_SUCCESS(status);
770          TEST_ASSERT(numStatuses == 2);
771          TEST_ASSERT(statusVals[0] == 100);
772          TEST_ASSERT(statusVals[1] == 300);
773 
774          // a
775          pos = bi->next();
776          TEST_ASSERT(pos==2);
777          numStatuses = bi->getRuleStatusVec(statusVals, 10, status);
778          TEST_ASSERT_SUCCESS(status);
779          TEST_ASSERT(numStatuses == 2);
780          TEST_ASSERT(statusVals[0] == 200);
781          TEST_ASSERT(statusVals[1] == 300);
782 
783          // p
784          pos = bi->next();
785          TEST_ASSERT(pos==3);
786          numStatuses = bi->getRuleStatusVec(statusVals, 10, status);
787          TEST_ASSERT_SUCCESS(status);
788          TEST_ASSERT(numStatuses == 2);
789          TEST_ASSERT(statusVals[0] == 200);
790          TEST_ASSERT(statusVals[1] == 300);
791 
792          // z
793          pos = bi->next();
794          TEST_ASSERT(pos==4);
795          numStatuses = bi->getRuleStatusVec(statusVals, 10, status);
796          TEST_ASSERT_SUCCESS(status);
797          TEST_ASSERT(numStatuses == 1);
798          TEST_ASSERT(statusVals[0] == 300);
799 
800          // 5
801          pos = bi->next();
802          TEST_ASSERT(pos==5);
803          numStatuses = bi->getRuleStatusVec(statusVals, 10, status);
804          TEST_ASSERT_SUCCESS(status);
805          TEST_ASSERT(numStatuses == 2);
806          TEST_ASSERT(statusVals[0] == 400);
807          TEST_ASSERT(statusVals[1] == 500);
808 
809          // ?
810          pos = bi->next();
811          TEST_ASSERT(pos==6);
812          numStatuses = bi->getRuleStatusVec(statusVals, 10, status);
813          TEST_ASSERT_SUCCESS(status);
814          TEST_ASSERT(numStatuses == 1);
815          TEST_ASSERT(statusVals[0] == 0);
816 
817          //
818          //  Check buffer overflow error handling.   Char == A
819          //
820          bi->first();
821          pos = bi->next();
822          TEST_ASSERT(pos==1);
823          memset(statusVals, -1, sizeof(statusVals));
824          numStatuses = bi->getRuleStatusVec(statusVals, 0, status);
825          TEST_ASSERT(status == U_BUFFER_OVERFLOW_ERROR);
826          TEST_ASSERT(numStatuses == 2);
827          TEST_ASSERT(statusVals[0] == -1);
828 
829          status = U_ZERO_ERROR;
830          memset(statusVals, -1, sizeof(statusVals));
831          numStatuses = bi->getRuleStatusVec(statusVals, 1, status);
832          TEST_ASSERT(status == U_BUFFER_OVERFLOW_ERROR);
833          TEST_ASSERT(numStatuses == 2);
834          TEST_ASSERT(statusVals[0] == 100);
835          TEST_ASSERT(statusVals[1] == -1);
836 
837          status = U_ZERO_ERROR;
838          memset(statusVals, -1, sizeof(statusVals));
839          numStatuses = bi->getRuleStatusVec(statusVals, 2, status);
840          TEST_ASSERT_SUCCESS(status);
841          TEST_ASSERT(numStatuses == 2);
842          TEST_ASSERT(statusVals[0] == 100);
843          TEST_ASSERT(statusVals[1] == 300);
844          TEST_ASSERT(statusVals[2] == -1);
845      }
846      delete bi;
847 
848 }
849 
850 //
851 //   Bug 2190 Regression test.   Builder crash on rule consisting of only a
852 //                               $variable reference
TestBug2190()853 void RBBIAPITest::TestBug2190() {
854      UnicodeString rulesString1 = "$aaa = abcd;\n"
855                                   "$bbb = $aaa;\n"
856                                   "$bbb;\n";
857      UnicodeString testString1  = "abcdabcd";
858                                 // 01234567890
859      int32_t bounds1[] = {0, 4, 8};
860      UErrorCode status=U_ZERO_ERROR;
861      UParseError    parseError;
862 
863      RuleBasedBreakIterator *bi = new RuleBasedBreakIterator(rulesString1, parseError, status);
864      if(U_FAILURE(status)) {
865          dataerrln("Fail : in construction - %s", u_errorName(status));
866      } else {
867          bi->setText(testString1);
868          doBoundaryTest(*bi, testString1, bounds1);
869      }
870      delete bi;
871 }
872 
873 
TestRegistration()874 void RBBIAPITest::TestRegistration() {
875 #if !UCONFIG_NO_SERVICE
876     UErrorCode status = U_ZERO_ERROR;
877     BreakIterator* ja_word = BreakIterator::createWordInstance("ja_JP", status);
878     // ok to not delete these if we exit because of error?
879     BreakIterator* ja_char = BreakIterator::createCharacterInstance("ja_JP", status);
880     BreakIterator* root_word = BreakIterator::createWordInstance("", status);
881     BreakIterator* root_char = BreakIterator::createCharacterInstance("", status);
882 
883     if (status == U_MISSING_RESOURCE_ERROR || status == U_FILE_ACCESS_ERROR) {
884         dataerrln("Error creating instances of break interactors - %s", u_errorName(status));
885 
886         delete ja_word;
887         delete ja_char;
888         delete root_word;
889         delete root_char;
890 
891         return;
892     }
893 
894     URegistryKey key = BreakIterator::registerInstance(ja_word, "xx", UBRK_WORD, status);
895     {
896 #if 0 // With a dictionary based word breaking, ja_word is identical to root.
897         if (ja_word && *ja_word == *root_word) {
898             errln("japan not different from root");
899         }
900 #endif
901     }
902 
903     {
904         BreakIterator* result = BreakIterator::createWordInstance("xx_XX", status);
905         UBool fail = TRUE;
906         if(result){
907             fail = *result != *ja_word;
908         }
909         delete result;
910         if (fail) {
911             errln("bad result for xx_XX/word");
912         }
913     }
914 
915     {
916         BreakIterator* result = BreakIterator::createCharacterInstance("ja_JP", status);
917         UBool fail = TRUE;
918         if(result){
919             fail = *result != *ja_char;
920         }
921         delete result;
922         if (fail) {
923             errln("bad result for ja_JP/char");
924         }
925     }
926 
927     {
928         BreakIterator* result = BreakIterator::createCharacterInstance("xx_XX", status);
929         UBool fail = TRUE;
930         if(result){
931             fail = *result != *root_char;
932         }
933         delete result;
934         if (fail) {
935             errln("bad result for xx_XX/char");
936         }
937     }
938 
939     {
940         StringEnumeration* avail = BreakIterator::getAvailableLocales();
941         UBool found = FALSE;
942         const UnicodeString* p;
943         while ((p = avail->snext(status))) {
944             if (p->compare("xx") == 0) {
945                 found = TRUE;
946                 break;
947             }
948         }
949         delete avail;
950         if (!found) {
951             errln("did not find test locale");
952         }
953     }
954 
955     {
956         UBool unreg = BreakIterator::unregister(key, status);
957         if (!unreg) {
958             errln("unable to unregister");
959         }
960     }
961 
962     {
963         BreakIterator* result = BreakIterator::createWordInstance("en_US", status);
964         BreakIterator* root = BreakIterator::createWordInstance("", status);
965         UBool fail = TRUE;
966         if(root){
967           fail = *root != *result;
968         }
969         delete root;
970         delete result;
971         if (fail) {
972             errln("did not get root break");
973         }
974     }
975 
976     {
977         StringEnumeration* avail = BreakIterator::getAvailableLocales();
978         UBool found = FALSE;
979         const UnicodeString* p;
980         while ((p = avail->snext(status))) {
981             if (p->compare("xx") == 0) {
982                 found = TRUE;
983                 break;
984             }
985         }
986         delete avail;
987         if (found) {
988             errln("found test locale");
989         }
990     }
991 
992     {
993         int32_t count;
994         UBool   foundLocale = FALSE;
995         const Locale *avail = BreakIterator::getAvailableLocales(count);
996         for (int i=0; i<count; i++) {
997             if (avail[i] == Locale::getEnglish()) {
998                 foundLocale = TRUE;
999                 break;
1000             }
1001         }
1002         if (foundLocale == FALSE) {
1003             errln("BreakIterator::getAvailableLocales(&count), failed to find EN.");
1004         }
1005     }
1006 
1007 
1008     // ja_word was adopted by factory
1009     delete ja_char;
1010     delete root_word;
1011     delete root_char;
1012 #endif
1013 }
1014 
RoundtripRule(const char * dataFile)1015 void RBBIAPITest::RoundtripRule(const char *dataFile) {
1016     UErrorCode status = U_ZERO_ERROR;
1017     UParseError parseError;
1018     parseError.line = 0;
1019     parseError.offset = 0;
1020     LocalUDataMemoryPointer data(udata_open(U_ICUDATA_BRKITR, "brk", dataFile, &status));
1021     uint32_t length;
1022     const UChar *builtSource;
1023     const uint8_t *rbbiRules;
1024     const uint8_t *builtRules;
1025 
1026     if (U_FAILURE(status)) {
1027         errcheckln(status, "Can't open \"%s\" - %s", dataFile, u_errorName(status));
1028         return;
1029     }
1030 
1031     builtRules = (const uint8_t *)udata_getMemory(data.getAlias());
1032     builtSource = (const UChar *)(builtRules + ((RBBIDataHeader*)builtRules)->fRuleSource);
1033     RuleBasedBreakIterator *brkItr = new RuleBasedBreakIterator(builtSource, parseError, status);
1034     if (U_FAILURE(status)) {
1035         errln("createRuleBasedBreakIterator: ICU Error \"%s\"  at line %d, column %d\n",
1036                 u_errorName(status), parseError.line, parseError.offset);
1037         return;
1038     };
1039     rbbiRules = brkItr->getBinaryRules(length);
1040     logln("Comparing \"%s\" len=%d", dataFile, length);
1041     if (memcmp(builtRules, rbbiRules, (int32_t)length) != 0) {
1042         errln("Built rules and rebuilt rules are different %s", dataFile);
1043         return;
1044     }
1045     delete brkItr;
1046 }
1047 
TestRoundtripRules()1048 void RBBIAPITest::TestRoundtripRules() {
1049     RoundtripRule("word");
1050     RoundtripRule("title");
1051     RoundtripRule("sent");
1052     RoundtripRule("line");
1053     RoundtripRule("char");
1054     if (!quick) {
1055         RoundtripRule("word_POSIX");
1056     }
1057 }
1058 
1059 // Try out the RuleBasedBreakIterator constructors that take RBBIDataHeader*
1060 // (these are protected so we access them via a local class RBBIWithProtectedFunctions).
1061 // This is just a sanity check, not a thorough test (e.g. we don't check that the
1062 // first delete actually frees rulesCopy).
TestCreateFromRBBIData()1063 void RBBIAPITest::TestCreateFromRBBIData() {
1064     // Get some handy RBBIData
1065     const char *brkName = "word"; // or "sent", "line", "char", etc.
1066     UErrorCode status = U_ZERO_ERROR;
1067     LocalUDataMemoryPointer data(udata_open(U_ICUDATA_BRKITR, "brk", brkName, &status));
1068     if ( U_SUCCESS(status) ) {
1069         const RBBIDataHeader * builtRules = (const RBBIDataHeader *)udata_getMemory(data.getAlias());
1070         uint32_t length = builtRules->fLength;
1071         RBBIWithProtectedFunctions * brkItr;
1072 
1073         // Try the memory-adopting constructor, need to copy the data first
1074         RBBIDataHeader * rulesCopy = (RBBIDataHeader *) uprv_malloc(length);
1075         if ( rulesCopy ) {
1076             uprv_memcpy( rulesCopy, builtRules, length );
1077 
1078             brkItr = new RBBIWithProtectedFunctions(rulesCopy, status);
1079             if ( U_SUCCESS(status) ) {
1080                 delete brkItr; // this should free rulesCopy
1081             } else {
1082                 errln("create RuleBasedBreakIterator from RBBIData (adopted): ICU Error \"%s\"\n", u_errorName(status) );
1083                 status = U_ZERO_ERROR;// reset for the next test
1084                 uprv_free( rulesCopy );
1085             }
1086         }
1087 
1088         // Now try the non-adopting constructor
1089         brkItr = new RBBIWithProtectedFunctions(builtRules, RBBIWithProtectedFunctions::kDontAdopt, status);
1090         if ( U_SUCCESS(status) ) {
1091             delete brkItr; // this should NOT attempt to free builtRules
1092             if (builtRules->fLength != length) { // sanity check
1093                 errln("create RuleBasedBreakIterator from RBBIData (non-adopted): delete affects data\n" );
1094             }
1095         } else {
1096             errln("create RuleBasedBreakIterator from RBBIData (non-adopted): ICU Error \"%s\"\n", u_errorName(status) );
1097         }
1098     }
1099 
1100     // getBinaryRules() and RuleBasedBreakIterator(uint8_t binaryRules, ...)
1101     //
1102     status = U_ZERO_ERROR;
1103     RuleBasedBreakIterator *rb = (RuleBasedBreakIterator *)BreakIterator::createWordInstance(Locale::getEnglish(), status);
1104     if (rb == NULL || U_FAILURE(status)) {
1105         dataerrln("Unable to create BreakIterator::createWordInstance (Locale::getEnglish) - %s", u_errorName(status));
1106     } else {
1107         uint32_t length;
1108         const uint8_t *rules = rb->getBinaryRules(length);
1109         RuleBasedBreakIterator *rb2 = new RuleBasedBreakIterator(rules, length, status);
1110         TEST_ASSERT_SUCCESS(status);
1111         TEST_ASSERT(*rb == *rb2);
1112         UnicodeString words = "one two three ";
1113         rb2->setText(words);
1114         int wordCounter = 0;
1115         while (rb2->next() != UBRK_DONE) {
1116             wordCounter++;
1117         }
1118         TEST_ASSERT(wordCounter == 6);
1119 
1120         status = U_ZERO_ERROR;
1121         RuleBasedBreakIterator *rb3 = new RuleBasedBreakIterator(rules, length-1, status);
1122         TEST_ASSERT(status == U_ILLEGAL_ARGUMENT_ERROR);
1123 
1124         delete rb;
1125         delete rb2;
1126         delete rb3;
1127     }
1128 }
1129 
1130 
TestRefreshInputText()1131 void RBBIAPITest::TestRefreshInputText() {
1132     /*
1133      *  RefreshInput changes out the input of a Break Iterator without
1134      *    changing anything else in the iterator's state.  Used with Java JNI,
1135      *    when Java moves the underlying string storage.   This test
1136      *    runs BreakIterator::next() repeatedly, moving the text in the middle of the sequence.
1137      *    The right set of boundaries should still be found.
1138      */
1139     UChar testStr[]  = {0x20, 0x41, 0x20, 0x42, 0x20, 0x43, 0x20, 0x44, 0x0};  /* = " A B C D"  */
1140     UChar movedStr[] = {0x20, 0x20, 0x20, 0x20, 0x20, 0x20, 0x20, 0x20,  0};
1141     UErrorCode status = U_ZERO_ERROR;
1142     UText ut1 = UTEXT_INITIALIZER;
1143     UText ut2 = UTEXT_INITIALIZER;
1144     RuleBasedBreakIterator *bi = (RuleBasedBreakIterator *)BreakIterator::createLineInstance(Locale::getEnglish(), status);
1145     TEST_ASSERT_SUCCESS(status);
1146 
1147     utext_openUChars(&ut1, testStr, -1, &status);
1148     TEST_ASSERT_SUCCESS(status);
1149 
1150     if (U_SUCCESS(status)) {
1151         bi->setText(&ut1, status);
1152         TEST_ASSERT_SUCCESS(status);
1153 
1154         /* Line boundaries will occur before each letter in the original string */
1155         TEST_ASSERT(1 == bi->next());
1156         TEST_ASSERT(3 == bi->next());
1157 
1158         /* Move the string, kill the original string.  */
1159         u_strcpy(movedStr, testStr);
1160         u_memset(testStr, 0x20, u_strlen(testStr));
1161         utext_openUChars(&ut2, movedStr, -1, &status);
1162         TEST_ASSERT_SUCCESS(status);
1163         RuleBasedBreakIterator *returnedBI = &bi->refreshInputText(&ut2, status);
1164         TEST_ASSERT_SUCCESS(status);
1165         TEST_ASSERT(bi == returnedBI);
1166 
1167         /* Find the following matches, now working in the moved string. */
1168         TEST_ASSERT(5 == bi->next());
1169         TEST_ASSERT(7 == bi->next());
1170         TEST_ASSERT(8 == bi->next());
1171         TEST_ASSERT(UBRK_DONE == bi->next());
1172 
1173         utext_close(&ut1);
1174         utext_close(&ut2);
1175     }
1176     delete bi;
1177 
1178 }
1179 
1180 
1181 //---------------------------------------------
1182 // runIndexedTest
1183 //---------------------------------------------
1184 
runIndexedTest(int32_t index,UBool exec,const char * & name,char *)1185 void RBBIAPITest::runIndexedTest( int32_t index, UBool exec, const char* &name, char* /*par*/ )
1186 {
1187     if (exec) logln((UnicodeString)"TestSuite RuleBasedBreakIterator API ");
1188     switch (index) {
1189      //   case 0: name = "TestConstruction"; if (exec) TestConstruction(); break;
1190 #if !UCONFIG_NO_FILE_IO
1191         case  0: name = "TestCloneEquals"; if (exec) TestCloneEquals(); break;
1192         case  1: name = "TestgetRules"; if (exec) TestgetRules(); break;
1193         case  2: name = "TestHashCode"; if (exec) TestHashCode(); break;
1194         case  3: name = "TestGetSetAdoptText"; if (exec) TestGetSetAdoptText(); break;
1195         case  4: name = "TestIteration"; if (exec) TestIteration(); break;
1196 #else
1197         case  0: case  1: case  2: case  3: case  4: name = "skip"; break;
1198 #endif
1199         case  5: name = "TestBuilder"; if (exec) TestBuilder(); break;
1200         case  6: name = "TestQuoteGrouping"; if (exec) TestQuoteGrouping(); break;
1201         case  7: name = "TestRuleStatusVec"; if (exec) TestRuleStatusVec(); break;
1202         case  8: name = "TestBug2190"; if (exec) TestBug2190(); break;
1203 #if !UCONFIG_NO_FILE_IO
1204         case  9: name = "TestRegistration"; if (exec) TestRegistration(); break;
1205         case 10: name = "TestBoilerPlate"; if (exec) TestBoilerPlate(); break;
1206         case 11: name = "TestRuleStatus"; if (exec) TestRuleStatus(); break;
1207         case 12: name = "TestRoundtripRules"; if (exec) TestRoundtripRules(); break;
1208         case 13: name = "TestCreateFromRBBIData"; if (exec) TestCreateFromRBBIData(); break;
1209 #else
1210         case  9: case 10: case 11: case 12: case 13: name = "skip"; break;
1211 #endif
1212         case 14: name = "TestRefreshInputText"; if (exec) TestRefreshInputText(); break;
1213 
1214         default: name = ""; break; // needed to end loop
1215     }
1216 }
1217 
1218 //---------------------------------------------
1219 //Internal subroutines
1220 //---------------------------------------------
1221 
doBoundaryTest(RuleBasedBreakIterator & bi,UnicodeString & text,int32_t * boundaries)1222 void RBBIAPITest::doBoundaryTest(RuleBasedBreakIterator& bi, UnicodeString& text, int32_t *boundaries){
1223      logln((UnicodeString)"testIsBoundary():");
1224         int32_t p = 0;
1225         UBool isB;
1226         for (int32_t i = 0; i < text.length(); i++) {
1227             isB = bi.isBoundary(i);
1228             logln((UnicodeString)"bi.isBoundary(" + i + ") -> " + isB);
1229 
1230             if (i == boundaries[p]) {
1231                 if (!isB)
1232                     errln((UnicodeString)"Wrong result from isBoundary() for " + i + (UnicodeString)": expected true, got false");
1233                 p++;
1234             }
1235             else {
1236                 if (isB)
1237                     errln((UnicodeString)"Wrong result from isBoundary() for " + i + (UnicodeString)": expected false, got true");
1238             }
1239         }
1240 }
doTest(UnicodeString & testString,int32_t start,int32_t gotoffset,int32_t expectedOffset,const char * expectedString)1241 void RBBIAPITest::doTest(UnicodeString& testString, int32_t start, int32_t gotoffset, int32_t expectedOffset, const char* expectedString){
1242     UnicodeString selected;
1243     UnicodeString expected=CharsToUnicodeString(expectedString);
1244 
1245     if(gotoffset != expectedOffset)
1246          errln((UnicodeString)"ERROR:****returned #" + gotoffset + (UnicodeString)" instead of #" + expectedOffset);
1247     if(start <= gotoffset){
1248         testString.extractBetween(start, gotoffset, selected);
1249     }
1250     else{
1251         testString.extractBetween(gotoffset, start, selected);
1252     }
1253     if(selected.compare(expected) != 0)
1254          errln(prettify((UnicodeString)"ERROR:****selected \"" + selected + "\" instead of \"" + expected + "\""));
1255     else
1256         logln(prettify("****selected \"" + selected + "\""));
1257 }
1258 
1259 //---------------------------------------------
1260 //RBBIWithProtectedFunctions class functions
1261 //---------------------------------------------
1262 
RBBIWithProtectedFunctions(RBBIDataHeader * data,UErrorCode & status)1263 RBBIWithProtectedFunctions::RBBIWithProtectedFunctions(RBBIDataHeader* data, UErrorCode &status)
1264     : RuleBasedBreakIterator(data, status)
1265 {
1266 }
1267 
RBBIWithProtectedFunctions(const RBBIDataHeader * data,enum EDontAdopt,UErrorCode & status)1268 RBBIWithProtectedFunctions::RBBIWithProtectedFunctions(const RBBIDataHeader* data, enum EDontAdopt, UErrorCode &status)
1269     : RuleBasedBreakIterator(data, RuleBasedBreakIterator::kDontAdopt, status)
1270 {
1271 }
1272 
1273 #endif /* #if !UCONFIG_NO_BREAK_ITERATION */
1274