1 // Copyright (C) 2016 and later: Unicode, Inc. and others.
2 // License & terms of use: http://www.unicode.org/copyright.html
3 /****************************************************************************************
4  * COPYRIGHT:
5  * Copyright (c) 1997-2014, International Business Machines Corporation and
6  * others. All Rights Reserved.
7  * Modification History:
8  *
9  *   Date          Name        Description
10  *   05/22/2000    Madhu       Added tests for testing new API for utf16 support and more
11  ****************************************************************************************/
12 
13 #include <string.h>
14 #include "utypeinfo.h"  // for 'typeid' to work
15 
16 #include "unicode/chariter.h"
17 #include "unicode/ustring.h"
18 #include "unicode/unistr.h"
19 #include "unicode/schriter.h"
20 #include "unicode/uchriter.h"
21 #include "unicode/uiter.h"
22 #include "unicode/putil.h"
23 #include "unicode/utf16.h"
24 #include "citrtest.h"
25 #include "cmemory.h"
26 
27 
28 class  SCharacterIterator : public CharacterIterator {
29 public:
SCharacterIterator(const UnicodeString & textStr)30     SCharacterIterator(const UnicodeString& textStr){
31         text = textStr;
32         pos=0;
33         textLength = textStr.length();
34         begin = 0;
35         end=textLength;
36 
37     }
38 
~SCharacterIterator()39     virtual ~SCharacterIterator(){};
40 
41 
setText(const UnicodeString & newText)42     void setText(const UnicodeString& newText){
43         text = newText;
44     }
45 
getText(UnicodeString & result)46     virtual void getText(UnicodeString& result) {
47         text.extract(0,text.length(),result);
48     }
getStaticClassID(void)49     static UClassID getStaticClassID(void){
50         return (UClassID)(&fgClassID);
51     }
getDynamicClassID(void) const52     virtual UClassID getDynamicClassID(void) const{
53         return getStaticClassID();
54     }
55 
operator ==(const ForwardCharacterIterator &) const56     virtual UBool operator==(const ForwardCharacterIterator& /*that*/) const{
57         return TRUE;
58     }
59 
clone(void) const60     virtual CharacterIterator* clone(void) const {
61         return NULL;
62     }
hashCode(void) const63     virtual int32_t hashCode(void) const{
64         return DONE;
65     }
nextPostInc(void)66     virtual UChar nextPostInc(void){ return text.charAt(pos++);}
next32PostInc(void)67     virtual UChar32 next32PostInc(void){return text.char32At(pos++);}
hasNext()68     virtual UBool hasNext() { return TRUE;};
first()69     virtual UChar first(){return DONE;};
first32()70     virtual UChar32 first32(){return DONE;};
last()71     virtual UChar last(){return DONE;};
last32()72     virtual UChar32 last32(){return DONE;};
setIndex(int32_t)73     virtual UChar setIndex(int32_t /*pos*/){return DONE;};
setIndex32(int32_t)74     virtual UChar32 setIndex32(int32_t /*pos*/){return DONE;};
current() const75     virtual UChar current() const{return DONE;};
current32() const76     virtual UChar32 current32() const{return DONE;};
next()77     virtual UChar next(){return DONE;};
next32()78     virtual UChar32 next32(){return DONE;};
previous()79     virtual UChar previous(){return DONE;};
previous32()80     virtual UChar32 previous32(){return DONE;};
move(int32_t delta,CharacterIterator::EOrigin origin)81     virtual int32_t move(int32_t delta,CharacterIterator::EOrigin origin){
82         switch(origin) {
83         case kStart:
84             pos = begin + delta;
85             break;
86         case kCurrent:
87             pos += delta;
88             break;
89         case kEnd:
90             pos = end + delta;
91             break;
92         default:
93             break;
94         }
95 
96         if(pos < begin) {
97             pos = begin;
98         } else if(pos > end) {
99             pos = end;
100         }
101 
102         return pos;
103     };
move32(int32_t delta,CharacterIterator::EOrigin origin)104     virtual int32_t move32(int32_t delta, CharacterIterator::EOrigin origin){
105         switch(origin) {
106         case kStart:
107             pos = begin;
108             if(delta > 0) {
109                 U16_FWD_N(text, pos, end, delta);
110             }
111             break;
112         case kCurrent:
113             if(delta > 0) {
114                 U16_FWD_N(text, pos, end, delta);
115             } else {
116                 U16_BACK_N(text, begin, pos, -delta);
117             }
118             break;
119         case kEnd:
120             pos = end;
121             if(delta < 0) {
122                 U16_BACK_N(text, begin, pos, -delta);
123             }
124             break;
125         default:
126             break;
127         }
128 
129         return pos;
130     };
hasPrevious()131     virtual UBool hasPrevious() {return TRUE;};
132 
operator =(const SCharacterIterator & that)133   SCharacterIterator&  operator=(const SCharacterIterator&    that){
134      text = that.text;
135      return *this;
136   }
137 
138 
139 private:
140     UnicodeString text;
141     static const char fgClassID;
142 };
143 const char SCharacterIterator::fgClassID=0;
144 
CharIterTest()145 CharIterTest::CharIterTest()
146 {
147 }
runIndexedTest(int32_t index,UBool exec,const char * & name,char *)148 void CharIterTest::runIndexedTest( int32_t index, UBool exec, const char* &name, char* /*par*/ )
149 {
150     if (exec) logln("TestSuite CharIterTest: ");
151     switch (index) {
152         case 0: name = "TestConstructionAndEquality"; if (exec) TestConstructionAndEquality(); break;
153         case 1: name = "TestConstructionAndEqualityUChariter"; if (exec) TestConstructionAndEqualityUChariter(); break;
154         case 2: name = "TestIteration"; if (exec) TestIteration(); break;
155         case 3: name = "TestIterationUChar32"; if (exec) TestIterationUChar32(); break;
156         case 4: name = "TestUCharIterator"; if (exec) TestUCharIterator(); break;
157         case 5: name = "TestCoverage"; if(exec) TestCoverage(); break;
158         case 6: name = "TestCharIteratorSubClasses"; if (exec) TestCharIteratorSubClasses(); break;
159         default: name = ""; break; //needed to end loop
160     }
161 }
162 
TestCoverage()163 void CharIterTest::TestCoverage(){
164     UnicodeString  testText("Now is the time for all good men to come to the aid of their country.");
165     UnicodeString testText2("\\ud800\\udc01deadbeef");
166     testText2 = testText2.unescape();
167     SCharacterIterator* test = new SCharacterIterator(testText);
168     if(test->firstPostInc()!= 0x004E){
169         errln("Failed: firstPostInc() failed");
170     }
171     if(test->getIndex()!=1){
172         errln("Failed: getIndex().");
173     }
174     if(test->getLength()!=testText.length()){
175         errln("Failed: getLength()");
176     }
177     test->setToStart();
178     if(test->getIndex()!=0){
179         errln("Failed: setToStart().");
180     }
181     test->setToEnd();
182     if(test->getIndex()!=testText.length()){
183         errln("Failed: setToEnd().");
184     }
185     if(test->startIndex() != 0){
186         errln("Failed: startIndex()");
187     }
188     test->setText(testText2);
189     if(test->first32PostInc()!= testText2.char32At(0)){
190         errln("Failed: first32PostInc() failed");
191     }
192 
193     delete test;
194 
195 }
TestConstructionAndEquality()196 void CharIterTest::TestConstructionAndEquality() {
197     UnicodeString  testText("Now is the time for all good men to come to the aid of their country.");
198     UnicodeString  testText2("Don't bother using this string.");
199     UnicodeString result1, result2, result3;
200 
201     CharacterIterator* test1 = new StringCharacterIterator(testText);
202     CharacterIterator* test1b= new StringCharacterIterator(testText, -1);
203     CharacterIterator* test1c= new StringCharacterIterator(testText, 100);
204     CharacterIterator* test1d= new StringCharacterIterator(testText, -2, 100, 5);
205     CharacterIterator* test1e= new StringCharacterIterator(testText, 100, 20, 5);
206     CharacterIterator* test2 = new StringCharacterIterator(testText, 5);
207     CharacterIterator* test3 = new StringCharacterIterator(testText, 2, 20, 5);
208     CharacterIterator* test4 = new StringCharacterIterator(testText2);
209     CharacterIterator* test5 = test1->clone();
210 
211     if (test1d->startIndex() < 0)
212         errln("Construction failed: startIndex is negative");
213     if (test1d->endIndex() > testText.length())
214         errln("Construction failed: endIndex is greater than the text length");
215     if (test1d->getIndex() < test1d->startIndex() || test1d->endIndex() < test1d->getIndex())
216         errln("Construction failed: index is invalid");
217 
218     if (*test1 == *test2 || *test1 == *test3 || *test1 == *test4)
219         errln("Construction or operator== failed: Unequal objects compared equal");
220     if (*test1 != *test5)
221         errln("clone() or equals() failed: Two clones tested unequal");
222 
223     if (test1->hashCode() == test2->hashCode() || test1->hashCode() == test3->hashCode()
224                     || test1->hashCode() == test4->hashCode())
225         errln("hashCode() failed:  different objects have same hash code");
226 
227     if (test1->hashCode() != test5->hashCode())
228         errln("hashCode() failed:  identical objects have different hash codes");
229 
230     if(test1->getLength() != testText.length()){
231         errln("getLength of CharacterIterator failed");
232     }
233     test1->getText(result1);
234     test1b->getText(result2);
235     test1c->getText(result3);
236     if(result1 != result2 ||  result1 != result3)
237         errln("construction failed or getText() failed");
238 
239 
240     test1->setIndex(5);
241     if (*test1 != *test2 || *test1 == *test5)
242         errln("setIndex() failed");
243 
244     *((StringCharacterIterator*)test1) = *((StringCharacterIterator*)test3);
245     if (*test1 != *test3 || *test1 == *test5)
246         errln("operator= failed");
247 
248     delete test2;
249     delete test3;
250     delete test4;
251     delete test5;
252     delete test1b;
253     delete test1c;
254     delete test1d;
255     delete test1e;
256 
257 
258     StringCharacterIterator* testChar1=new StringCharacterIterator(testText);
259     StringCharacterIterator* testChar2=new StringCharacterIterator(testText2);
260     StringCharacterIterator* testChar3=(StringCharacterIterator*)test1->clone();
261 
262     testChar1->getText(result1);
263     testChar2->getText(result2);
264     testChar3->getText(result3);
265     if(result1 != result3 || result1 == result2)
266         errln("getText() failed");
267     testChar3->setText(testText2);
268     testChar3->getText(result3);
269     if(result1 == result3 || result2 != result3)
270         errln("setText() or getText() failed");
271     testChar3->setText(testText);
272     testChar3->getText(result3);
273     if(result1 != result3 || result1 == result2)
274         errln("setText() or getText() round-trip failed");
275 
276     delete testChar1;
277     delete testChar2;
278     delete testChar3;
279     delete test1;
280 
281 }
TestConstructionAndEqualityUChariter()282 void CharIterTest::TestConstructionAndEqualityUChariter() {
283     U_STRING_DECL(testText, "Now is the time for all good men to come to the aid of their country.", 69);
284     U_STRING_DECL(testText2, "Don't bother using this string.", 31);
285 
286     U_STRING_INIT(testText, "Now is the time for all good men to come to the aid of their country.", 69);
287     U_STRING_INIT(testText2, "Don't bother using this string.", 31);
288 
289     UnicodeString result, result4, result5;
290 
291     UCharCharacterIterator* test1 = new UCharCharacterIterator(testText, u_strlen(testText));
292     UCharCharacterIterator* test2 = new UCharCharacterIterator(testText, u_strlen(testText), 5);
293     UCharCharacterIterator* test3 = new UCharCharacterIterator(testText, u_strlen(testText), 2, 20, 5);
294     UCharCharacterIterator* test4 = new UCharCharacterIterator(testText2, u_strlen(testText2));
295     UCharCharacterIterator* test5 = (UCharCharacterIterator*)test1->clone();
296     UCharCharacterIterator* test6 = new UCharCharacterIterator(*test1);
297 
298     // j785: length=-1 will use u_strlen()
299     UCharCharacterIterator* test7a = new UCharCharacterIterator(testText, -1);
300     UCharCharacterIterator* test7b = new UCharCharacterIterator(testText, -1);
301     UCharCharacterIterator* test7c = new UCharCharacterIterator(testText, -1, 2, 20, 5);
302 
303     // Bad parameters.
304     UCharCharacterIterator* test8a = new UCharCharacterIterator(testText, -1, -1, 20, 5);
305     UCharCharacterIterator* test8b = new UCharCharacterIterator(testText, -1, 2, 100, 5);
306     UCharCharacterIterator* test8c = new UCharCharacterIterator(testText, -1, 2, 20, 100);
307 
308     if (test8a->startIndex() < 0)
309         errln("Construction failed: startIndex is negative");
310     if (test8b->endIndex() != u_strlen(testText))
311         errln("Construction failed: endIndex is different from the text length");
312     if (test8c->getIndex() < test8c->startIndex() || test8c->endIndex() < test8c->getIndex())
313         errln("Construction failed: index is invalid");
314 
315     if (*test1 == *test2 || *test1 == *test3 || *test1 == *test4 )
316         errln("Construction or operator== failed: Unequal objects compared equal");
317     if (*test1 != *test5 )
318         errln("clone() or equals() failed: Two clones tested unequal");
319 
320     if (*test6 != *test1 )
321         errln("copy construction or equals() failed: Two copies tested unequal");
322 
323     if (test1->hashCode() == test2->hashCode() || test1->hashCode() == test3->hashCode()
324                     || test1->hashCode() == test4->hashCode())
325         errln("hashCode() failed:  different objects have same hash code");
326 
327     if (test1->hashCode() != test5->hashCode())
328         errln("hashCode() failed:  identical objects have different hash codes");
329 
330     test7a->getText(result);
331     test7b->getText(result4);
332     test7c->getText(result5);
333 
334     if(result != UnicodeString(testText) || result4 != result || result5 != result)
335         errln("error in construction");
336 
337     test1->getText(result);
338     test4->getText(result4);
339     test5->getText(result5);
340     if(result != result5 || result == result4)
341         errln("getText() failed");
342     test5->setText(testText2, u_strlen(testText2));
343     test5->getText(result5);
344     if(result == result5 || result4 != result5)
345         errln("setText() or getText() failed");
346     test5->setText(testText, u_strlen(testText));
347     test5->getText(result5);
348     if(result != result5 || result == result4)
349         errln("setText() or getText() round-trip failed");
350 
351 
352     test1->setIndex(5);
353     if (*test1 != *test2 || *test1 == *test5)
354         errln("setIndex() failed");
355     test8b->setIndex32(5);
356     if (test8b->getIndex()!=5)
357         errln("setIndex32() failed");
358 
359     *test1 = *test3;
360     if (*test1 != *test3 || *test1 == *test5)
361         errln("operator= failed");
362 
363     delete test1;
364     delete test2;
365     delete test3;
366     delete test4;
367     delete test5;
368     delete test6;
369     delete test7a;
370     delete test7b;
371     delete test7c;
372     delete test8a;
373     delete test8b;
374     delete test8c;
375 }
376 
377 
TestIteration()378 void CharIterTest::TestIteration() {
379     UnicodeString text("Now is the time for all good men to come to the aid of their country.");
380 
381     UChar c;
382     int32_t i;
383     {
384         StringCharacterIterator   iter(text, 5);
385 
386         UnicodeString iterText;
387         iter.getText(iterText);
388         if (iterText != text)
389           errln("iter.getText() failed");
390 
391         if (iter.current() != text[(int32_t)5])
392             errln("Iterator didn't start out in the right place.");
393 
394         c = iter.first();
395         i = 0;
396 
397         if (iter.startIndex() != 0 || iter.endIndex() != text.length())
398             errln("startIndex() or endIndex() failed");
399 
400         logln("Testing forward iteration...");
401         do {
402             if (c == CharacterIterator::DONE && i != text.length())
403                 errln("Iterator reached end prematurely");
404             else if (c != text[i])
405                 errln((UnicodeString)"Character mismatch at position " + i +
406                                     ", iterator has " + UCharToUnicodeString(c) +
407                                     ", string has " + UCharToUnicodeString(text[i]));
408 
409             if (iter.current() != c)
410                 errln("current() isn't working right");
411             if (iter.getIndex() != i)
412                 errln("getIndex() isn't working right");
413 
414             if (c != CharacterIterator::DONE) {
415                 c = iter.next();
416                 i++;
417             }
418         } while (c != CharacterIterator::DONE);
419         c=iter.next();
420         if(c!= CharacterIterator::DONE)
421             errln("next() didn't return DONE at the end");
422         c=iter.setIndex(text.length()+1);
423         if(c!= CharacterIterator::DONE)
424             errln("setIndex(len+1) didn't return DONE");
425 
426         c = iter.last();
427         i = text.length() - 1;
428 
429         logln("Testing backward iteration...");
430         do {
431             if (c == CharacterIterator::DONE && i >= 0)
432                 errln("Iterator reached end prematurely");
433             else if (c != text[i])
434                 errln((UnicodeString)"Character mismatch at position " + i +
435                                     ", iterator has " + UCharToUnicodeString(c) +
436                                     ", string has " + UCharToUnicodeString(text[i]));
437 
438             if (iter.current() != c)
439                 errln("current() isn't working right");
440             if (iter.getIndex() != i)
441                 errln("getIndex() isn't working right");
442             if(iter.setIndex(i) != c)
443                 errln("setIndex() isn't working right");
444 
445             if (c != CharacterIterator::DONE) {
446                 c = iter.previous();
447                 i--;
448             }
449         } while (c != CharacterIterator::DONE);
450 
451         c=iter.previous();
452         if(c!= CharacterIterator::DONE)
453             errln("previous didn't return DONE at the beginning");
454 
455 
456         //testing firstPostInc, nextPostInc, setTostart
457         i = 0;
458         c=iter.firstPostInc();
459         if(c != text[i])
460             errln((UnicodeString)"firstPostInc failed.  Expected->" +
461                          UCharToUnicodeString(text[i]) + " Got->" + UCharToUnicodeString(c));
462         if(iter.getIndex() != i+1)
463             errln((UnicodeString)"getIndex() after firstPostInc() failed");
464 
465         iter.setToStart();
466         i=0;
467         if (iter.startIndex() != 0)
468             errln("setToStart failed");
469 
470         logln("Testing forward iteration...");
471         do {
472             if (c != CharacterIterator::DONE)
473                 c = iter.nextPostInc();
474 
475             if(c != text[i])
476                 errln((UnicodeString)"Character mismatch at position " + i +
477                                     (UnicodeString)", iterator has " + UCharToUnicodeString(c) +
478                                     (UnicodeString)", string has " + UCharToUnicodeString(text[i]));
479 
480             i++;
481             if(iter.getIndex() != i)
482                 errln("getIndex() aftr nextPostInc() isn't working right");
483             if(iter.current() != text[i])
484                 errln("current() after nextPostInc() isn't working right");
485         } while (iter.hasNext());
486         c=iter.nextPostInc();
487         if(c!= CharacterIterator::DONE)
488             errln("nextPostInc() didn't return DONE at the beginning");
489     }
490 
491     {
492         StringCharacterIterator iter(text, 5, 15, 10);
493         if (iter.startIndex() != 5 || iter.endIndex() != 15)
494             errln("creation of a restricted-range iterator failed");
495 
496         if (iter.getIndex() != 10 || iter.current() != text[(int32_t)10])
497             errln("starting the iterator in the middle didn't work");
498 
499         c = iter.first();
500         i = 5;
501 
502         logln("Testing forward iteration over a range...");
503         do {
504             if (c == CharacterIterator::DONE && i != 15)
505                 errln("Iterator reached end prematurely");
506             else if (c != text[i])
507                 errln((UnicodeString)"Character mismatch at position " + i +
508                                     ", iterator has " + UCharToUnicodeString(c) +
509                                     ", string has " + UCharToUnicodeString(text[i]));
510 
511             if (iter.current() != c)
512                 errln("current() isn't working right");
513             if (iter.getIndex() != i)
514                 errln("getIndex() isn't working right");
515             if(iter.setIndex(i) != c)
516                 errln("setIndex() isn't working right");
517 
518             if (c != CharacterIterator::DONE) {
519                 c = iter.next();
520                 i++;
521             }
522         } while (c != CharacterIterator::DONE);
523 
524         c = iter.last();
525         i = 14;
526 
527         logln("Testing backward iteration over a range...");
528         do {
529             if (c == CharacterIterator::DONE && i >= 5)
530                 errln("Iterator reached end prematurely");
531             else if (c != text[i])
532                 errln((UnicodeString)"Character mismatch at position " + i +
533                                     ", iterator has " + UCharToUnicodeString(c) +
534                                     ", string has " + UCharToUnicodeString(text[i]));
535 
536             if (iter.current() != c)
537                 errln("current() isn't working right");
538             if (iter.getIndex() != i)
539                 errln("getIndex() isn't working right");
540 
541             if (c != CharacterIterator::DONE) {
542                 c = iter.previous();
543                 i--;
544             }
545         } while (c != CharacterIterator::DONE);
546 
547 
548     }
549 }
550 
551 //Tests for new API for utf-16 support
TestIterationUChar32()552 void CharIterTest::TestIterationUChar32() {
553     UChar textChars[]={ 0x0061, 0x0062, 0xd841, 0xdc02, 0x20ac, 0xd7ff, 0xd842, 0xdc06, 0xd801, 0xdc00, 0x0061, 0x0000};
554     UnicodeString text(textChars);
555     UChar32 c;
556     int32_t i;
557     {
558         StringCharacterIterator   iter(text, 1);
559 
560         UnicodeString iterText;
561         iter.getText(iterText);
562         if (iterText != text)
563           errln("iter.getText() failed");
564 
565         if (iter.current32() != text[(int32_t)1])
566             errln("Iterator didn't start out in the right place.");
567 
568         c=iter.setToStart();
569         i=0;
570         i=iter.move32(1, CharacterIterator::kStart);
571         c=iter.current32();
572         if(c != text.char32At(1) || i!=1)
573             errln("move32(1, kStart) didn't work correctly expected %X got %X", c, text.char32At(1) );
574 
575         i=iter.move32(2, CharacterIterator::kCurrent);
576         c=iter.current32();
577         if(c != text.char32At(4) || i!=4)
578             errln("move32(2, kCurrent) didn't work correctly expected %X got %X i=%ld", c, text.char32At(4), i);
579 
580         i=iter.move32(-2, CharacterIterator::kCurrent);
581         c=iter.current32();
582         if(c != text.char32At(1) || i!=1)
583             errln("move32(-2, kCurrent) didn't work correctly expected %X got %X i=%d", c, text.char32At(1), i);
584 
585 
586         i=iter.move32(-2, CharacterIterator::kEnd);
587         c=iter.current32();
588         if(c != text.char32At((text.length()-3)) || i!=(text.length()-3))
589             errln("move32(-2, kEnd) didn't work correctly expected %X got %X i=%d", c, text.char32At((text.length()-3)), i);
590 
591 
592         c = iter.first32();
593         i = 0;
594 
595         if (iter.startIndex() != 0 || iter.endIndex() != text.length())
596             errln("startIndex() or endIndex() failed");
597 
598         logln("Testing forward iteration...");
599         do {
600             /* logln("c=%d i=%d char32At=%d", c, i, text.char32At(i)); */
601             if (c == CharacterIterator::DONE && i != text.length())
602                 errln("Iterator reached end prematurely");
603             else if(iter.hasNext() == FALSE && i != text.length())
604                 errln("Iterator reached end prematurely.  Failed at hasNext");
605             else if (c != text.char32At(i))
606                 errln("Character mismatch at position %d, iterator has %X, string has %X", i, c, text.char32At(i));
607 
608             if (iter.current32() != c)
609                 errln("current32() isn't working right");
610             if(iter.setIndex32(i) != c)
611                 errln("setIndex32() isn't working right");
612             if (c != CharacterIterator::DONE) {
613                 c = iter.next32();
614                 i=UTF16_NEED_MULTIPLE_UCHAR(c) ? i+2 : i+1;
615             }
616         } while (c != CharacterIterator::DONE);
617         if(iter.hasNext() == TRUE)
618            errln("hasNext() returned true at the end of the string");
619 
620 
621 
622         c=iter.setToEnd();
623         if(iter.getIndex() != text.length() || iter.hasNext() != FALSE)
624             errln("setToEnd failed");
625 
626         c=iter.next32();
627         if(c!= CharacterIterator::DONE)
628             errln("next32 didn't return DONE at the end");
629         c=iter.setIndex32(text.length()+1);
630         if(c!= CharacterIterator::DONE)
631             errln("setIndex32(len+1) didn't return DONE");
632 
633 
634         c = iter.last32();
635         i = text.length()-1;
636         logln("Testing backward iteration...");
637         do {
638             if (c == CharacterIterator::DONE && i >= 0)
639                 errln((UnicodeString)"Iterator reached start prematurely for i=" + i);
640             else if(iter.hasPrevious() == FALSE && i>0)
641                 errln((UnicodeString)"Iterator reached start prematurely for i=" + i);
642             else if (c != text.char32At(i))
643                 errln("Character mismatch at position %d, iterator has %X, string has %X", i, c, text.char32At(i));
644 
645             if (iter.current32() != c)
646                 errln("current32() isn't working right");
647             if(iter.setIndex32(i) != c)
648                 errln("setIndex32() isn't working right");
649             if (iter.getIndex() != i)
650                 errln("getIndex() isn't working right");
651             if (c != CharacterIterator::DONE) {
652                 c = iter.previous32();
653                 i=UTF16_NEED_MULTIPLE_UCHAR(c) ? i-2 : i-1;
654             }
655         } while (c != CharacterIterator::DONE);
656         if(iter.hasPrevious() == TRUE)
657             errln("hasPrevious returned true after reaching the start");
658 
659         c=iter.previous32();
660         if(c!= CharacterIterator::DONE)
661             errln("previous32 didn't return DONE at the beginning");
662 
663 
664 
665 
666         //testing first32PostInc, next32PostInc, setTostart
667         i = 0;
668         c=iter.first32PostInc();
669         if(c != text.char32At(i))
670             errln("first32PostInc failed.  Expected->%X Got->%X", text.char32At(i), c);
671         if(iter.getIndex() != U16_LENGTH(c) + i)
672             errln((UnicodeString)"getIndex() after first32PostInc() failed");
673 
674         iter.setToStart();
675         i=0;
676         if (iter.startIndex() != 0)
677             errln("setToStart failed");
678 
679         logln("Testing forward iteration...");
680         do {
681             if (c != CharacterIterator::DONE)
682                 c = iter.next32PostInc();
683 
684             if(c != text.char32At(i))
685                 errln("Character mismatch at position %d, iterator has %X, string has %X", i, c, text.char32At(i));
686 
687             i=UTF16_NEED_MULTIPLE_UCHAR(c) ? i+2 : i+1;
688             if(iter.getIndex() != i)
689                 errln("getIndex() aftr next32PostInc() isn't working right");
690             if(iter.current32() != text.char32At(i))
691                 errln("current() after next32PostInc() isn't working right");
692         } while (iter.hasNext());
693         c=iter.next32PostInc();
694         if(c!= CharacterIterator::DONE)
695             errln("next32PostInc() didn't return DONE at the beginning");
696 
697 
698     }
699 
700     {
701         StringCharacterIterator iter(text, 1, 11, 10);
702         if (iter.startIndex() != 1 || iter.endIndex() != 11)
703             errln("creation of a restricted-range iterator failed");
704 
705         if (iter.getIndex() != 10 || iter.current32() != text.char32At(10))
706             errln("starting the iterator in the middle didn't work");
707 
708         c = iter.first32();
709 
710         i = 1;
711 
712         logln("Testing forward iteration over a range...");
713         do {
714             if (c == CharacterIterator::DONE && i != 11)
715                 errln("Iterator reached end prematurely");
716             else if(iter.hasNext() == FALSE)
717                 errln("Iterator reached end prematurely");
718             else if (c != text.char32At(i))
719                 errln("Character mismatch at position %d, iterator has %X, string has %X", i, c, text.char32At(i));
720 
721             if (iter.current32() != c)
722                 errln("current32() isn't working right");
723             if(iter.setIndex32(i) != c)
724                 errln("setIndex32() isn't working right");
725 
726             if (c != CharacterIterator::DONE) {
727                 c = iter.next32();
728                 i=UTF16_NEED_MULTIPLE_UCHAR(c) ? i+2 : i+1;
729             }
730         } while (c != CharacterIterator::DONE);
731         c=iter.next32();
732         if(c != CharacterIterator::DONE)
733             errln("error in next32()");
734 
735 
736 
737         c=iter.last32();
738         i = 10;
739         logln("Testing backward iteration over a range...");
740         do {
741             if (c == CharacterIterator::DONE && i >= 5)
742                 errln("Iterator reached start prematurely");
743             else if(iter.hasPrevious() == FALSE && i > 5)
744                 errln("Iterator reached start prematurely");
745             else if (c != text.char32At(i))
746                 errln("Character mismatch at position %d, iterator has %X, string has %X", i, c, text.char32At(i));
747             if (iter.current32() != c)
748                 errln("current32() isn't working right");
749             if (iter.getIndex() != i)
750                 errln("getIndex() isn't working right");
751             if(iter.setIndex32(i) != c)
752                 errln("setIndex32() isn't working right");
753 
754             if (c != CharacterIterator::DONE) {
755                 c = iter.previous32();
756                 i=UTF16_NEED_MULTIPLE_UCHAR(c) ? i-2 : i-1;
757             }
758 
759         } while (c != CharacterIterator::DONE);
760         c=iter.previous32();
761         if(c!= CharacterIterator::DONE)
762             errln("error on previous32");
763 
764 
765     }
766 }
767 
TestUCharIterator(UCharIterator * iter,CharacterIterator & ci,const char * moves,const char * which)768 void CharIterTest::TestUCharIterator(UCharIterator *iter, CharacterIterator &ci,
769                                      const char *moves, const char *which) {
770     int32_t m;
771     UChar32 c, c2;
772     UBool h, h2;
773 
774     for(m=0;; ++m) {
775         // move both iter and s[index]
776         switch(moves[m]) {
777         case '0':
778             h=iter->hasNext(iter);
779             h2=ci.hasNext();
780             c=iter->current(iter);
781             c2=ci.current();
782             break;
783         case '|':
784             h=iter->hasNext(iter);
785             h2=ci.hasNext();
786             c=uiter_current32(iter);
787             c2=ci.current32();
788             break;
789 
790         case '+':
791             h=iter->hasNext(iter);
792             h2=ci.hasNext();
793             c=iter->next(iter);
794             c2=ci.nextPostInc();
795             break;
796         case '>':
797             h=iter->hasNext(iter);
798             h2=ci.hasNext();
799             c=uiter_next32(iter);
800             c2=ci.next32PostInc();
801             break;
802 
803         case '-':
804             h=iter->hasPrevious(iter);
805             h2=ci.hasPrevious();
806             c=iter->previous(iter);
807             c2=ci.previous();
808             break;
809         case '<':
810             h=iter->hasPrevious(iter);
811             h2=ci.hasPrevious();
812             c=uiter_previous32(iter);
813             c2=ci.previous32();
814             break;
815 
816         case '2':
817             h=h2=FALSE;
818             c=(UChar32)iter->move(iter, 2, UITER_CURRENT);
819             c2=(UChar32)ci.move(2, CharacterIterator::kCurrent);
820             break;
821 
822         case '8':
823             h=h2=FALSE;
824             c=(UChar32)iter->move(iter, -2, UITER_CURRENT);
825             c2=(UChar32)ci.move(-2, CharacterIterator::kCurrent);
826             break;
827 
828         case 0:
829             return;
830         default:
831             errln("error: unexpected move character '%c' in \"%s\"", moves[m], moves);
832             return;
833         }
834 
835         // compare results
836         if(c2==0xffff) {
837             c2=(UChar32)-1;
838         }
839         if(c!=c2 || h!=h2 || ci.getIndex()!=iter->getIndex(iter, UITER_CURRENT)) {
840             errln("error: UCharIterator(%s) misbehaving at \"%s\"[%d]='%c'", which, moves, m, moves[m]);
841         }
842     }
843 }
844 
TestUCharIterator()845 void CharIterTest::TestUCharIterator() {
846     // test string of length 8
847     UnicodeString s=UnicodeString("a \\U00010001b\\U0010fffdz", "").unescape();
848     const char *const moves=
849         "0+++++++++" // 10 moves per line
850         "----0-----"
851         ">>|>>>>>>>"
852         "<<|<<<<<<<"
853         "22+>8>-8+2";
854 
855     StringCharacterIterator sci(s), compareCI(s);
856 
857     UCharIterator sIter, cIter, rIter;
858 
859     uiter_setString(&sIter, s.getBuffer(), s.length());
860     uiter_setCharacterIterator(&cIter, &sci);
861     uiter_setReplaceable(&rIter, &s);
862 
863     TestUCharIterator(&sIter, compareCI, moves, "uiter_setString");
864     compareCI.setIndex(0);
865     TestUCharIterator(&cIter, compareCI, moves, "uiter_setCharacterIterator");
866     compareCI.setIndex(0);
867     TestUCharIterator(&rIter, compareCI, moves, "uiter_setReplaceable");
868 
869     // test move & getIndex some more
870     sIter.start=2;
871     sIter.index=3;
872     sIter.limit=5;
873     if( sIter.getIndex(&sIter, UITER_ZERO)!=0 ||
874         sIter.getIndex(&sIter, UITER_START)!=2 ||
875         sIter.getIndex(&sIter, UITER_CURRENT)!=3 ||
876         sIter.getIndex(&sIter, UITER_LIMIT)!=5 ||
877         sIter.getIndex(&sIter, UITER_LENGTH)!=s.length()
878     ) {
879         errln("error: UCharIterator(string).getIndex returns wrong index");
880     }
881 
882     if( sIter.move(&sIter, 4, UITER_ZERO)!=4 ||
883         sIter.move(&sIter, 1, UITER_START)!=3 ||
884         sIter.move(&sIter, 3, UITER_CURRENT)!=5 ||
885         sIter.move(&sIter, -1, UITER_LIMIT)!=4 ||
886         sIter.move(&sIter, -5, UITER_LENGTH)!=3 ||
887         sIter.move(&sIter, 0, UITER_CURRENT)!=sIter.getIndex(&sIter, UITER_CURRENT) ||
888         sIter.getIndex(&sIter, UITER_CURRENT)!=3
889     ) {
890         errln("error: UCharIterator(string).move sets/returns wrong index");
891     }
892 
893     sci=StringCharacterIterator(s, 2, 5, 3);
894     uiter_setCharacterIterator(&cIter, &sci);
895     if( cIter.getIndex(&cIter, UITER_ZERO)!=0 ||
896         cIter.getIndex(&cIter, UITER_START)!=2 ||
897         cIter.getIndex(&cIter, UITER_CURRENT)!=3 ||
898         cIter.getIndex(&cIter, UITER_LIMIT)!=5 ||
899         cIter.getIndex(&cIter, UITER_LENGTH)!=s.length()
900     ) {
901         errln("error: UCharIterator(character iterator).getIndex returns wrong index");
902     }
903 
904     if( cIter.move(&cIter, 4, UITER_ZERO)!=4 ||
905         cIter.move(&cIter, 1, UITER_START)!=3 ||
906         cIter.move(&cIter, 3, UITER_CURRENT)!=5 ||
907         cIter.move(&cIter, -1, UITER_LIMIT)!=4 ||
908         cIter.move(&cIter, -5, UITER_LENGTH)!=3 ||
909         cIter.move(&cIter, 0, UITER_CURRENT)!=cIter.getIndex(&cIter, UITER_CURRENT) ||
910         cIter.getIndex(&cIter, UITER_CURRENT)!=3
911     ) {
912         errln("error: UCharIterator(character iterator).move sets/returns wrong index");
913     }
914 
915 
916     if(cIter.getIndex(&cIter, (enum UCharIteratorOrigin)-1) != -1)
917     {
918         errln("error: UCharIterator(char iter).getIndex did not return error value");
919     }
920 
921     if(cIter.move(&cIter, 0, (enum UCharIteratorOrigin)-1) != -1)
922     {
923         errln("error: UCharIterator(char iter).move did not return error value");
924     }
925 
926 
927     if(rIter.getIndex(&rIter, (enum UCharIteratorOrigin)-1) != -1)
928     {
929         errln("error: UCharIterator(repl iter).getIndex did not return error value");
930     }
931 
932     if(rIter.move(&rIter, 0, (enum UCharIteratorOrigin)-1) != -1)
933     {
934         errln("error: UCharIterator(repl iter).move did not return error value");
935     }
936 
937 
938     if(sIter.getIndex(&sIter, (enum UCharIteratorOrigin)-1) != -1)
939     {
940         errln("error: UCharIterator(string iter).getIndex did not return error value");
941     }
942 
943     if(sIter.move(&sIter, 0, (enum UCharIteratorOrigin)-1) != -1)
944     {
945         errln("error: UCharIterator(string iter).move did not return error value");
946     }
947 
948     /* Testing function coverage on bad input */
949     UErrorCode status = U_ZERO_ERROR;
950     uiter_setString(&sIter, NULL, 1);
951     uiter_setState(&sIter, 1, &status);
952     if (status != U_UNSUPPORTED_ERROR) {
953         errln("error: uiter_setState returned %s instead of U_UNSUPPORTED_ERROR", u_errorName(status));
954     }
955     status = U_ZERO_ERROR;
956     uiter_setState(NULL, 1, &status);
957     if (status != U_ILLEGAL_ARGUMENT_ERROR) {
958         errln("error: uiter_setState returned %s instead of U_ILLEGAL_ARGUMENT_ERROR", u_errorName(status));
959     }
960     if (uiter_getState(&sIter) != UITER_NO_STATE) {
961         errln("error: uiter_getState did not return UITER_NO_STATE on bad input");
962     }
963 }
964 
965 // subclass test, and completing API coverage -------------------------------
966 
967 class SubCharIter : public CharacterIterator {
968 public:
969     // public default constructor, to get coverage of CharacterIterator()
SubCharIter()970     SubCharIter() : CharacterIterator() {
971         textLength=end=UPRV_LENGTHOF(s);
972         s[0]=0x61;      // 'a'
973         s[1]=0xd900;    // U+50400
974         s[2]=0xdd00;
975         s[3]=0x2029;    // PS
976     }
977 
978     // useful stuff, mostly dummy but testing coverage and subclassability
nextPostInc()979     virtual UChar nextPostInc() {
980         if(pos<UPRV_LENGTHOF(s)) {
981             return s[pos++];
982         } else {
983             return DONE;
984         }
985     }
986 
next32PostInc()987     virtual UChar32 next32PostInc() {
988         if(pos<UPRV_LENGTHOF(s)) {
989             UChar32 c;
990             U16_NEXT(s, pos, UPRV_LENGTHOF(s), c);
991             return c;
992         } else {
993             return DONE;
994         }
995     }
996 
hasNext()997     virtual UBool hasNext() {
998         return pos<UPRV_LENGTHOF(s);
999     }
1000 
first()1001     virtual UChar first() {
1002         pos=0;
1003         return s[0];
1004     }
1005 
first32()1006     virtual UChar32 first32() {
1007         UChar32 c;
1008         pos=0;
1009         U16_NEXT(s, pos, UPRV_LENGTHOF(s), c);
1010         pos=0;
1011         return c;
1012     }
1013 
setIndex(int32_t position)1014     virtual UChar setIndex(int32_t position) {
1015         if(0<=position && position<=UPRV_LENGTHOF(s)) {
1016             pos=position;
1017             if(pos<UPRV_LENGTHOF(s)) {
1018                 return s[pos];
1019             }
1020         }
1021         return DONE;
1022     }
1023 
setIndex32(int32_t position)1024     virtual UChar32 setIndex32(int32_t position) {
1025         if(0<=position && position<=UPRV_LENGTHOF(s)) {
1026             pos=position;
1027             if(pos<UPRV_LENGTHOF(s)) {
1028                 UChar32 c;
1029                 U16_GET(s, 0, pos, UPRV_LENGTHOF(s), c);
1030                 return c;
1031             }
1032         }
1033         return DONE;
1034     }
1035 
current() const1036     virtual UChar current() const {
1037         if(pos<UPRV_LENGTHOF(s)) {
1038             return s[pos];
1039         } else {
1040             return DONE;
1041         }
1042     }
1043 
current32() const1044     virtual UChar32 current32() const {
1045         if(pos<UPRV_LENGTHOF(s)) {
1046             UChar32 c;
1047             U16_GET(s, 0, pos, UPRV_LENGTHOF(s), c);
1048             return c;
1049         } else {
1050             return DONE;
1051         }
1052     }
1053 
next()1054     virtual UChar next() {
1055         if(pos<UPRV_LENGTHOF(s) && ++pos<UPRV_LENGTHOF(s)) {
1056             return s[pos];
1057         } else {
1058             return DONE;
1059         }
1060     }
1061 
next32()1062     virtual UChar32 next32() {
1063         if(pos<UPRV_LENGTHOF(s)) {
1064             U16_FWD_1(s, pos, UPRV_LENGTHOF(s));
1065         }
1066         if(pos<UPRV_LENGTHOF(s)) {
1067             UChar32 c;
1068             int32_t i=pos;
1069             U16_NEXT(s, i, UPRV_LENGTHOF(s), c);
1070             return c;
1071         } else {
1072             return DONE;
1073         }
1074     }
1075 
hasPrevious()1076     virtual UBool hasPrevious() {
1077         return pos>0;
1078     }
1079 
getText(UnicodeString & result)1080     virtual void getText(UnicodeString &result) {
1081         result.setTo(s, UPRV_LENGTHOF(s));
1082     }
1083 
1084     // dummy implementations of other pure virtual base class functions
operator ==(const ForwardCharacterIterator & that) const1085     virtual UBool operator==(const ForwardCharacterIterator &that) const {
1086         return
1087             this==&that ||
1088             (typeid(*this)==typeid(that) && pos==((SubCharIter &)that).pos);
1089     }
1090 
hashCode() const1091     virtual int32_t hashCode() const {
1092         return 2;
1093     }
1094 
clone() const1095     virtual CharacterIterator *clone() const {
1096         return NULL;
1097     }
1098 
last()1099     virtual UChar last() {
1100         return 0;
1101     }
1102 
last32()1103     virtual UChar32 last32() {
1104         return 0;
1105     }
1106 
previous()1107     virtual UChar previous() {
1108         return 0;
1109     }
1110 
previous32()1111     virtual UChar32 previous32() {
1112         return 0;
1113     }
1114 
move(int32_t,EOrigin)1115     virtual int32_t move(int32_t /*delta*/, EOrigin /*origin*/) {
1116         return 0;
1117     }
1118 
move32(int32_t,EOrigin)1119     virtual int32_t move32(int32_t /*delta*/, EOrigin /*origin*/) {
1120         return 0;
1121     }
1122 
1123     // RTTI
getStaticClassID()1124     static UClassID getStaticClassID() {
1125         return (UClassID)(&fgClassID);
1126     }
1127 
getDynamicClassID() const1128     virtual UClassID getDynamicClassID() const {
1129         return getStaticClassID();
1130     }
1131 
1132 private:
1133     // dummy string data
1134     UChar s[4];
1135 
1136     static const char fgClassID;
1137 };
1138 
1139 const char SubCharIter::fgClassID = 0;
1140 
1141 class SubStringCharIter : public StringCharacterIterator {
1142 public:
SubStringCharIter()1143     SubStringCharIter() {
1144         setText(UNICODE_STRING("abc", 3));
1145     }
1146 };
1147 
1148 class SubUCharCharIter : public UCharCharacterIterator {
1149 public:
SubUCharCharIter()1150     SubUCharCharIter() {
1151         setText(u, 3);
1152     }
1153 
1154 private:
1155     static const UChar u[3];
1156 };
1157 
1158 const UChar SubUCharCharIter::u[3]={ 0x61, 0x62, 0x63 };
1159 
TestCharIteratorSubClasses()1160 void CharIterTest::TestCharIteratorSubClasses() {
1161     SubCharIter *p;
1162 
1163     // coverage - call functions that are not otherwise tested
1164     // first[32]PostInc() are default implementations that are overridden
1165     // in ICU's own CharacterIterator subclasses
1166     p=new SubCharIter;
1167     if(p->firstPostInc()!=0x61) {
1168         errln("SubCharIter.firstPosInc() failed\n");
1169     }
1170     delete p;
1171 
1172     p=new SubCharIter[2];
1173     if(p[1].first32PostInc()!=0x61) {
1174         errln("SubCharIter.first32PosInc() failed\n");
1175     }
1176     delete [] p;
1177 
1178     // coverage: StringCharacterIterator default constructor
1179     SubStringCharIter sci;
1180     if(sci.firstPostInc()!=0x61) {
1181         errln("SubStringCharIter.firstPostInc() failed\n");
1182     }
1183 
1184     // coverage: UCharCharacterIterator default constructor
1185     SubUCharCharIter uci;
1186     if(uci.firstPostInc()!=0x61) {
1187         errln("SubUCharCharIter.firstPostInc() failed\n");
1188     }
1189 }
1190