1 // © 2016 and later: Unicode, Inc. and others.
2 // License & terms of use: http://www.unicode.org/copyright.html
3 /*
4 ******************************************************************************
5 *
6 *   Copyright (C) 2001-2016, International Business Machines
7 *   Corporation and others.  All Rights Reserved.
8 *
9 ******************************************************************************
10 *   file name:  trietest.c
11 *   encoding:   UTF-8
12 *   tab size:   8 (not used)
13 *   indentation:4
14 *
15 *   created on: 2001nov20
16 *   created by: Markus W. Scherer
17 */
18 
19 #include <stdio.h>
20 #include "unicode/utypes.h"
21 #include "unicode/utf16.h"
22 #include "utrie.h"
23 #include "cstring.h"
24 #include "cmemory.h"
25 
26 #if 1
27 #include "cintltst.h"
28 #else
29 /* definitions from standalone utrie development */
30 #define log_err printf
31 #define log_verbose printf
32 
33 #undef u_errorName
34 #define u_errorName(errorCode) "some error code"
35 #endif
36 
37 /* Values for setting possibly overlapping, out-of-order ranges of values */
38 typedef struct SetRange {
39     UChar32 start, limit;
40     uint32_t value;
41     UBool overwrite;
42 } SetRange;
43 
44 /*
45  * Values for testing:
46  * value is set from the previous boundary's limit to before
47  * this boundary's limit
48  */
49 typedef struct CheckRange {
50     UChar32 limit;
51     uint32_t value;
52 } CheckRange;
53 
54 
55 static uint32_t U_CALLCONV
_testFoldedValue32(UNewTrie * trie,UChar32 start,int32_t offset)56 _testFoldedValue32(UNewTrie *trie, UChar32 start, int32_t offset) {
57     uint32_t foldedValue, value;
58     UChar32 limit;
59     UBool inBlockZero;
60 
61     foldedValue=0;
62 
63     limit=start+0x400;
64     while(start<limit) {
65         value=utrie_get32(trie, start, &inBlockZero);
66         if(inBlockZero) {
67             start+=UTRIE_DATA_BLOCK_LENGTH;
68         } else {
69             foldedValue|=value;
70             ++start;
71         }
72     }
73 
74     if(foldedValue!=0) {
75         return ((uint32_t)offset<<16)|foldedValue;
76     } else {
77         return 0;
78     }
79 }
80 
81 static int32_t U_CALLCONV
_testFoldingOffset32(uint32_t data)82 _testFoldingOffset32(uint32_t data) {
83     return (int32_t)(data>>16);
84 }
85 
86 static uint32_t U_CALLCONV
_testFoldedValue16(UNewTrie * trie,UChar32 start,int32_t offset)87 _testFoldedValue16(UNewTrie *trie, UChar32 start, int32_t offset) {
88     uint32_t foldedValue, value;
89     UChar32 limit;
90     UBool inBlockZero;
91 
92     foldedValue=0;
93 
94     limit=start+0x400;
95     while(start<limit) {
96         value=utrie_get32(trie, start, &inBlockZero);
97         if(inBlockZero) {
98             start+=UTRIE_DATA_BLOCK_LENGTH;
99         } else {
100             foldedValue|=value;
101             ++start;
102         }
103     }
104 
105     if(foldedValue!=0) {
106         return (uint32_t)(offset|0x8000);
107     } else {
108         return 0;
109     }
110 }
111 
112 static int32_t U_CALLCONV
_testFoldingOffset16(uint32_t data)113 _testFoldingOffset16(uint32_t data) {
114     if(data&0x8000) {
115         return (int32_t)(data&0x7fff);
116     } else {
117         return 0;
118     }
119 }
120 
121 static uint32_t U_CALLCONV
_testEnumValue(const void * context,uint32_t value)122 _testEnumValue(const void *context, uint32_t value) {
123     return value^0x5555;
124 }
125 
126 static UBool U_CALLCONV
_testEnumRange(const void * context,UChar32 start,UChar32 limit,uint32_t value)127 _testEnumRange(const void *context, UChar32 start, UChar32 limit, uint32_t value) {
128     const CheckRange **pb=(const CheckRange **)context;
129     const CheckRange *b=(*pb)++;
130 
131     value^=0x5555;
132     if(start!=(b-1)->limit || limit!=b->limit || value!=b->value) {
133         log_err("error: utrie_enum() delivers wrong range [U+%04lx..U+%04lx[.0x%lx instead of [U+%04lx..U+%04lx[.0x%lx\n",
134             start, limit, value,
135             (b-1)->limit, b->limit, b->value);
136     }
137     return TRUE;
138 }
139 
140 static void
testTrieIteration(const char * testName,const UTrie * trie,const CheckRange checkRanges[],int32_t countCheckRanges)141 testTrieIteration(const char *testName,
142                   const UTrie *trie,
143                   const CheckRange checkRanges[], int32_t countCheckRanges) {
144     UChar s[100];
145     uint32_t values[30];
146 
147     const UChar *p, *limit;
148 
149     uint32_t value;
150     UChar32 c;
151     int32_t i, length, countValues;
152     UChar c2;
153 
154     /* write a string */
155     length=countValues=0;
156     for(i=0; i<countCheckRanges; ++i) {
157         c=checkRanges[i].limit;
158         if(c!=0) {
159             --c;
160             U16_APPEND_UNSAFE(s, length, c);
161             values[countValues++]=checkRanges[i].value;
162         }
163     }
164     limit=s+length;
165 
166     /* try forward */
167     p=s;
168     i=0;
169     while(p<limit) {
170         c=c2=0x33;
171         if(trie->data32!=NULL) {
172             UTRIE_NEXT32(trie, p, limit, c, c2, value);
173         } else {
174             UTRIE_NEXT16(trie, p, limit, c, c2, value);
175         }
176         if(value!=values[i]) {
177             log_err("error: wrong value from UTRIE_NEXT(%s)(U+%04lx, U+%04lx): 0x%lx instead of 0x%lx\n",
178                     testName, c, c2, value, values[i]);
179         }
180         if(
181             c2==0 ?
182                 c!=*(p-1) :
183                 !U16_IS_LEAD(c) || !U16_IS_TRAIL(c2) || c!=*(p-2) || c2!=*(p-1)
184         ) {
185             log_err("error: wrong (c, c2) from UTRIE_NEXT(%s): (U+%04lx, U+%04lx)\n",
186                     testName, c, c2);
187             continue;
188         }
189         if(c2!=0) {
190             int32_t offset;
191 
192             if(trie->data32==NULL) {
193                 value=UTRIE_GET16_FROM_LEAD(trie, c);
194                 offset=trie->getFoldingOffset(value);
195                 if(offset>0) {
196                     value=UTRIE_GET16_FROM_OFFSET_TRAIL(trie, offset, c2);
197                 } else {
198                     value=trie->initialValue;
199                 }
200             } else {
201                 value=UTRIE_GET32_FROM_LEAD(trie, c);
202                 offset=trie->getFoldingOffset(value);
203                 if(offset>0) {
204                     value=UTRIE_GET32_FROM_OFFSET_TRAIL(trie, offset, c2);
205                 } else {
206                     value=trie->initialValue;
207                 }
208             }
209             if(value!=values[i]) {
210                 log_err("error: wrong value from UTRIE_GETXX_FROM_OFFSET_TRAIL(%s)(U+%04lx, U+%04lx): 0x%lx instead of 0x%lx\n",
211                         testName, c, c2, value, values[i]);
212             }
213         }
214         if(c2!=0) {
215             value=0x44;
216             if(trie->data32==NULL) {
217                 UTRIE_GET16_FROM_PAIR(trie, c, c2, value);
218             } else {
219                 UTRIE_GET32_FROM_PAIR(trie, c, c2, value);
220             }
221             if(value!=values[i]) {
222                 log_err("error: wrong value from UTRIE_GETXX_FROM_PAIR(%s)(U+%04lx, U+%04lx): 0x%lx instead of 0x%lx\n",
223                         testName, c, c2, value, values[i]);
224             }
225         }
226         ++i;
227     }
228 
229     /* try backward */
230     p=limit;
231     i=countValues;
232     while(s<p) {
233         --i;
234         c=c2=0x33;
235         if(trie->data32!=NULL) {
236             UTRIE_PREVIOUS32(trie, s, p, c, c2, value);
237         } else {
238             UTRIE_PREVIOUS16(trie, s, p, c, c2, value);
239         }
240         if(value!=values[i]) {
241             log_err("error: wrong value from UTRIE_PREVIOUS(%s)(U+%04lx, U+%04lx): 0x%lx instead of 0x%lx\n",
242                     testName, c, c2, value, values[i]);
243         }
244         if(
245             c2==0 ?
246                 c!=*p:
247                 !U16_IS_LEAD(c) || !U16_IS_TRAIL(c2) || c!=*p || c2!=*(p+1)
248         ) {
249             log_err("error: wrong (c, c2) from UTRIE_PREVIOUS(%s): (U+%04lx, U+%04lx)\n",
250                     testName, c, c2);
251         }
252     }
253 }
254 
255 static void
testTrieRangesWithMalloc(const char * testName,const SetRange setRanges[],int32_t countSetRanges,const CheckRange checkRanges[],int32_t countCheckRanges,UBool dataIs32,UBool latin1Linear)256 testTrieRangesWithMalloc(const char *testName,
257                const SetRange setRanges[], int32_t countSetRanges,
258                const CheckRange checkRanges[], int32_t countCheckRanges,
259                UBool dataIs32, UBool latin1Linear) {
260     UTrieGetFoldingOffset *getFoldingOffset;
261     const CheckRange *enumRanges;
262     UNewTrie *newTrie;
263     UTrie trie={ 0 };
264     uint32_t value, value2;
265     UChar32 start, limit;
266     int32_t i, length;
267     UErrorCode errorCode;
268     UBool overwrite, ok;
269     uint8_t* storage =NULL;
270     static const int32_t DEFAULT_STORAGE_SIZE = 32768;
271     storage = (uint8_t*) uprv_malloc(sizeof(uint8_t)*DEFAULT_STORAGE_SIZE);
272 
273     log_verbose("\ntesting Trie '%s'\n", testName);
274     newTrie=utrie_open(NULL, NULL, 2000,
275                        checkRanges[0].value, checkRanges[0].value,
276                        latin1Linear);
277 
278     /* set values from setRanges[] */
279     ok=TRUE;
280     for(i=0; i<countSetRanges; ++i) {
281         start=setRanges[i].start;
282         limit=setRanges[i].limit;
283         value=setRanges[i].value;
284         overwrite=setRanges[i].overwrite;
285         if((limit-start)==1 && overwrite) {
286             ok&=utrie_set32(newTrie, start, value);
287         } else {
288             ok&=utrie_setRange32(newTrie, start, limit, value, overwrite);
289         }
290     }
291     if(!ok) {
292         log_err("error: setting values into a trie failed (%s)\n", testName);
293         return;
294     }
295 
296     /* verify that all these values are in the new Trie */
297     start=0;
298     for(i=0; i<countCheckRanges; ++i) {
299         limit=checkRanges[i].limit;
300         value=checkRanges[i].value;
301 
302         while(start<limit) {
303             if(value!=utrie_get32(newTrie, start, NULL)) {
304                 log_err("error: newTrie(%s)[U+%04lx]==0x%lx instead of 0x%lx\n",
305                         testName, start, utrie_get32(newTrie, start, NULL), value);
306             }
307             ++start;
308         }
309     }
310 
311     if(dataIs32) {
312         getFoldingOffset=_testFoldingOffset32;
313     } else {
314         getFoldingOffset=_testFoldingOffset16;
315     }
316 
317     errorCode=U_ZERO_ERROR;
318     length=utrie_serialize(newTrie, storage, DEFAULT_STORAGE_SIZE,
319                            dataIs32 ? _testFoldedValue32 : _testFoldedValue16,
320                            (UBool)!dataIs32,
321                            &errorCode);
322     if(U_FAILURE(errorCode)) {
323         log_err("error: utrie_serialize(%s) failed: %s\n", testName, u_errorName(errorCode));
324         utrie_close(newTrie);
325         return;
326     }
327 
328     /* test linear Latin-1 range from utrie_getData() */
329     if(latin1Linear) {
330         uint32_t *data;
331         int32_t dataLength;
332 
333         data=utrie_getData(newTrie, &dataLength);
334         start=0;
335         for(i=0; i<countCheckRanges && start<=0xff; ++i) {
336             limit=checkRanges[i].limit;
337             value=checkRanges[i].value;
338 
339             while(start<limit && start<=0xff) {
340                 if(value!=data[UTRIE_DATA_BLOCK_LENGTH+start]) {
341                     log_err("error: newTrie(%s).latin1Data[U+%04lx]==0x%lx instead of 0x%lx\n",
342                             testName, start, data[UTRIE_DATA_BLOCK_LENGTH+start], value);
343                 }
344                 ++start;
345             }
346         }
347     }
348 
349     utrie_close(newTrie);
350 
351     errorCode=U_ZERO_ERROR;
352     if(!utrie_unserialize(&trie, storage, length, &errorCode)) {
353         log_err("error: utrie_unserialize() failed, %s\n", u_errorName(errorCode));
354         return;
355     }
356     trie.getFoldingOffset=getFoldingOffset;
357 
358     if(dataIs32!=(trie.data32!=NULL)) {
359         log_err("error: trie serialization (%s) did not preserve 32-bitness\n", testName);
360     }
361     if(latin1Linear!=trie.isLatin1Linear) {
362         log_err("error: trie serialization (%s) did not preserve Latin-1-linearity\n", testName);
363     }
364 
365     /* verify that all these values are in the unserialized Trie */
366     start=0;
367     for(i=0; i<countCheckRanges; ++i) {
368         limit=checkRanges[i].limit;
369         value=checkRanges[i].value;
370 
371         if(start==0xd800) {
372             /* skip surrogates */
373             start=limit;
374             continue;
375         }
376 
377         while(start<limit) {
378             if(start<=0xffff) {
379                 if(dataIs32) {
380                     value2=UTRIE_GET32_FROM_BMP(&trie, start);
381                 } else {
382                     value2=UTRIE_GET16_FROM_BMP(&trie, start);
383                 }
384                 if(value!=value2) {
385                     log_err("error: unserialized trie(%s).fromBMP(U+%04lx)==0x%lx instead of 0x%lx\n",
386                             testName, start, value2, value);
387                 }
388                 if(!U16_IS_LEAD(start)) {
389                     if(dataIs32) {
390                         value2=UTRIE_GET32_FROM_LEAD(&trie, start);
391                     } else {
392                         value2=UTRIE_GET16_FROM_LEAD(&trie, start);
393                     }
394                     if(value!=value2) {
395                         log_err("error: unserialized trie(%s).fromLead(U+%04lx)==0x%lx instead of 0x%lx\n",
396                                 testName, start, value2, value);
397                     }
398                 }
399             }
400             if(dataIs32) {
401                 UTRIE_GET32(&trie, start, value2);
402             } else {
403                 UTRIE_GET16(&trie, start, value2);
404             }
405             if(value!=value2) {
406                 log_err("error: unserialized trie(%s).get(U+%04lx)==0x%lx instead of 0x%lx\n",
407                         testName, start, value2, value);
408             }
409             ++start;
410         }
411     }
412 
413     /* enumerate and verify all ranges */
414     enumRanges=checkRanges+1;
415     utrie_enum(&trie, _testEnumValue, _testEnumRange, &enumRanges);
416 
417     /* test linear Latin-1 range */
418     if(trie.isLatin1Linear) {
419         if(trie.data32!=NULL) {
420             const uint32_t *latin1=UTRIE_GET32_LATIN1(&trie);
421 
422             for(start=0; start<0x100; ++start) {
423                 if(latin1[start]!=UTRIE_GET32_FROM_LEAD(&trie, start)) {
424                     log_err("error: (%s) trie.latin1[U+%04lx]=0x%lx!=0x%lx=trie.get32(U+%04lx)\n",
425                             testName, start, latin1[start], UTRIE_GET32_FROM_LEAD(&trie, start), start);
426                 }
427             }
428         } else {
429             const uint16_t *latin1=UTRIE_GET16_LATIN1(&trie);
430 
431             for(start=0; start<0x100; ++start) {
432                 if(latin1[start]!=UTRIE_GET16_FROM_LEAD(&trie, start)) {
433                     log_err("error: (%s) trie.latin1[U+%04lx]=0x%lx!=0x%lx=trie.get16(U+%04lx)\n",
434                             testName, start, latin1[start], UTRIE_GET16_FROM_LEAD(&trie, start), start);
435                 }
436             }
437         }
438     }
439 
440     testTrieIteration(testName, &trie, checkRanges, countCheckRanges);
441     uprv_free(storage);
442 }
443 
444 static void
testTrieRanges(const char * testName,const SetRange setRanges[],int32_t countSetRanges,const CheckRange checkRanges[],int32_t countCheckRanges,UBool dataIs32,UBool latin1Linear)445 testTrieRanges(const char *testName,
446                const SetRange setRanges[], int32_t countSetRanges,
447                const CheckRange checkRanges[], int32_t countCheckRanges,
448                UBool dataIs32, UBool latin1Linear) {
449     union{
450         double bogus; /* needed for aligining the storage */
451         uint8_t storage[32768];
452     } storageHolder;
453     UTrieGetFoldingOffset *getFoldingOffset;
454     UNewTrieGetFoldedValue *getFoldedValue;
455     const CheckRange *enumRanges;
456     UNewTrie *newTrie;
457     UTrie trie={ 0 };
458     uint32_t value, value2;
459     UChar32 start, limit;
460     int32_t i, length;
461     UErrorCode errorCode;
462     UBool overwrite, ok;
463 
464     log_verbose("\ntesting Trie '%s'\n", testName);
465     newTrie=utrie_open(NULL, NULL, 2000,
466                        checkRanges[0].value, checkRanges[0].value,
467                        latin1Linear);
468 
469     /* set values from setRanges[] */
470     ok=TRUE;
471     for(i=0; i<countSetRanges; ++i) {
472         start=setRanges[i].start;
473         limit=setRanges[i].limit;
474         value=setRanges[i].value;
475         overwrite=setRanges[i].overwrite;
476         if((limit-start)==1 && overwrite) {
477             ok&=utrie_set32(newTrie, start, value);
478         } else {
479             ok&=utrie_setRange32(newTrie, start, limit, value, overwrite);
480         }
481     }
482     if(!ok) {
483         log_err("error: setting values into a trie failed (%s)\n", testName);
484         return;
485     }
486 
487     /* verify that all these values are in the new Trie */
488     start=0;
489     for(i=0; i<countCheckRanges; ++i) {
490         limit=checkRanges[i].limit;
491         value=checkRanges[i].value;
492 
493         while(start<limit) {
494             if(value!=utrie_get32(newTrie, start, NULL)) {
495                 log_err("error: newTrie(%s)[U+%04lx]==0x%lx instead of 0x%lx\n",
496                         testName, start, utrie_get32(newTrie, start, NULL), value);
497             }
498             ++start;
499         }
500     }
501 
502     if(dataIs32) {
503         getFoldingOffset=_testFoldingOffset32;
504         getFoldedValue=_testFoldedValue32;
505     } else {
506         getFoldingOffset=_testFoldingOffset16;
507         getFoldedValue=_testFoldedValue16;
508     }
509 
510     /*
511      * code coverage for utrie.c/defaultGetFoldedValue(),
512      * pick some combination of parameters for selecting the UTrie defaults
513      */
514     if(!dataIs32 && latin1Linear) {
515         getFoldingOffset=NULL;
516         getFoldedValue=NULL;
517     }
518 
519     errorCode=U_ZERO_ERROR;
520     length=utrie_serialize(newTrie, storageHolder.storage, sizeof(storageHolder.storage),
521                            getFoldedValue,
522                            (UBool)!dataIs32,
523                            &errorCode);
524     if(U_FAILURE(errorCode)) {
525         log_err("error: utrie_serialize(%s) failed: %s\n", testName, u_errorName(errorCode));
526         utrie_close(newTrie);
527         return;
528     }
529     if (length >= (int32_t)sizeof(storageHolder.storage)) {
530         log_err("error: utrie_serialize(%s) needs more memory\n", testName);
531         utrie_close(newTrie);
532         return;
533     }
534 
535     /* test linear Latin-1 range from utrie_getData() */
536     if(latin1Linear) {
537         uint32_t *data;
538         int32_t dataLength;
539 
540         data=utrie_getData(newTrie, &dataLength);
541         start=0;
542         for(i=0; i<countCheckRanges && start<=0xff; ++i) {
543             limit=checkRanges[i].limit;
544             value=checkRanges[i].value;
545 
546             while(start<limit && start<=0xff) {
547                 if(value!=data[UTRIE_DATA_BLOCK_LENGTH+start]) {
548                     log_err("error: newTrie(%s).latin1Data[U+%04lx]==0x%lx instead of 0x%lx\n",
549                             testName, start, data[UTRIE_DATA_BLOCK_LENGTH+start], value);
550                 }
551                 ++start;
552             }
553         }
554     }
555 
556     utrie_close(newTrie);
557 
558     errorCode=U_ZERO_ERROR;
559     if(!utrie_unserialize(&trie, storageHolder.storage, length, &errorCode)) {
560         log_err("error: utrie_unserialize() failed, %s\n", u_errorName(errorCode));
561         return;
562     }
563     if(getFoldingOffset!=NULL) {
564         trie.getFoldingOffset=getFoldingOffset;
565     }
566 
567     if(dataIs32!=(trie.data32!=NULL)) {
568         log_err("error: trie serialization (%s) did not preserve 32-bitness\n", testName);
569     }
570     if(latin1Linear!=trie.isLatin1Linear) {
571         log_err("error: trie serialization (%s) did not preserve Latin-1-linearity\n", testName);
572     }
573 
574     /* verify that all these values are in the unserialized Trie */
575     start=0;
576     for(i=0; i<countCheckRanges; ++i) {
577         limit=checkRanges[i].limit;
578         value=checkRanges[i].value;
579 
580         if(start==0xd800) {
581             /* skip surrogates */
582             start=limit;
583             continue;
584         }
585 
586         while(start<limit) {
587             if(start<=0xffff) {
588                 if(dataIs32) {
589                     value2=UTRIE_GET32_FROM_BMP(&trie, start);
590                 } else {
591                     value2=UTRIE_GET16_FROM_BMP(&trie, start);
592                 }
593                 if(value!=value2) {
594                     log_err("error: unserialized trie(%s).fromBMP(U+%04lx)==0x%lx instead of 0x%lx\n",
595                             testName, start, value2, value);
596                 }
597                 if(!U16_IS_LEAD(start)) {
598                     if(dataIs32) {
599                         value2=UTRIE_GET32_FROM_LEAD(&trie, start);
600                     } else {
601                         value2=UTRIE_GET16_FROM_LEAD(&trie, start);
602                     }
603                     if(value!=value2) {
604                         log_err("error: unserialized trie(%s).fromLead(U+%04lx)==0x%lx instead of 0x%lx\n",
605                                 testName, start, value2, value);
606                     }
607                 }
608             }
609             if(dataIs32) {
610                 UTRIE_GET32(&trie, start, value2);
611             } else {
612                 UTRIE_GET16(&trie, start, value2);
613             }
614             if(value!=value2) {
615                 log_err("error: unserialized trie(%s).get(U+%04lx)==0x%lx instead of 0x%lx\n",
616                         testName, start, value2, value);
617             }
618             ++start;
619         }
620     }
621 
622     /* enumerate and verify all ranges */
623     enumRanges=checkRanges+1;
624     utrie_enum(&trie, _testEnumValue, _testEnumRange, &enumRanges);
625 
626     /* test linear Latin-1 range */
627     if(trie.isLatin1Linear) {
628         if(trie.data32!=NULL) {
629             const uint32_t *latin1=UTRIE_GET32_LATIN1(&trie);
630 
631             for(start=0; start<0x100; ++start) {
632                 if(latin1[start]!=UTRIE_GET32_FROM_LEAD(&trie, start)) {
633                     log_err("error: (%s) trie.latin1[U+%04lx]=0x%lx!=0x%lx=trie.get32(U+%04lx)\n",
634                             testName, start, latin1[start], UTRIE_GET32_FROM_LEAD(&trie, start), start);
635                 }
636             }
637         } else {
638             const uint16_t *latin1=UTRIE_GET16_LATIN1(&trie);
639 
640             for(start=0; start<0x100; ++start) {
641                 if(latin1[start]!=UTRIE_GET16_FROM_LEAD(&trie, start)) {
642                     log_err("error: (%s) trie.latin1[U+%04lx]=0x%lx!=0x%lx=trie.get16(U+%04lx)\n",
643                             testName, start, latin1[start], UTRIE_GET16_FROM_LEAD(&trie, start), start);
644                 }
645             }
646         }
647     }
648 
649     testTrieIteration(testName, &trie, checkRanges, countCheckRanges);
650 }
651 
652 static void
testTrieRanges2(const char * testName,const SetRange setRanges[],int32_t countSetRanges,const CheckRange checkRanges[],int32_t countCheckRanges,UBool dataIs32)653 testTrieRanges2(const char *testName,
654                 const SetRange setRanges[], int32_t countSetRanges,
655                 const CheckRange checkRanges[], int32_t countCheckRanges,
656                 UBool dataIs32) {
657     char name[40];
658 
659     testTrieRanges(testName,
660                    setRanges, countSetRanges,
661                    checkRanges, countCheckRanges,
662                    dataIs32, FALSE);
663     testTrieRangesWithMalloc(testName,
664                    setRanges, countSetRanges,
665                    checkRanges, countCheckRanges,
666                    dataIs32, FALSE);
667 
668     uprv_strcpy(name, testName);
669     uprv_strcat(name, "-latin1Linear");
670     testTrieRanges(name,
671                    setRanges, countSetRanges,
672                    checkRanges, countCheckRanges,
673                    dataIs32, TRUE);
674     testTrieRangesWithMalloc(name,
675                    setRanges, countSetRanges,
676                    checkRanges, countCheckRanges,
677                    dataIs32, TRUE);
678 }
679 
680 static void
testTrieRanges4(const char * testName,const SetRange setRanges[],int32_t countSetRanges,const CheckRange checkRanges[],int32_t countCheckRanges)681 testTrieRanges4(const char *testName,
682                 const SetRange setRanges[], int32_t countSetRanges,
683                 const CheckRange checkRanges[], int32_t countCheckRanges) {
684     char name[40];
685 
686     uprv_strcpy(name, testName);
687     uprv_strcat(name, ".32");
688     testTrieRanges2(name,
689                     setRanges, countSetRanges,
690                     checkRanges, countCheckRanges,
691                     TRUE);
692 
693     uprv_strcpy(name, testName);
694     uprv_strcat(name, ".16");
695     testTrieRanges2(name,
696                     setRanges, countSetRanges,
697                     checkRanges, countCheckRanges,
698                     FALSE);
699 }
700 
701 /* test data ----------------------------------------------------------------*/
702 
703 /* set consecutive ranges, even with value 0 */
704 static const SetRange
705 setRanges1[]={
706     {0,      0x20,       0,      FALSE},
707     {0x20,   0xa7,       0x1234, FALSE},
708     {0xa7,   0x3400,     0,      FALSE},
709     {0x3400, 0x9fa6,     0x6162, FALSE},
710     {0x9fa6, 0xda9e,     0x3132, FALSE},
711     {0xdada, 0xeeee,     0x87ff, FALSE}, /* try to disrupt _testFoldingOffset16() */
712     {0xeeee, 0x11111,    1,      FALSE},
713     {0x11111, 0x44444,   0x6162, FALSE},
714     {0x44444, 0x60003,   0,      FALSE},
715     {0xf0003, 0xf0004,   0xf,    FALSE},
716     {0xf0004, 0xf0006,   0x10,   FALSE},
717     {0xf0006, 0xf0007,   0x11,   FALSE},
718     {0xf0007, 0xf0020,   0x12,   FALSE},
719     {0xf0020, 0x110000,  0,      FALSE}
720 };
721 
722 static const CheckRange
723 checkRanges1[]={
724     {0,      0},      /* dummy start range to make _testEnumRange() simpler */
725     {0x20,   0},
726     {0xa7,   0x1234},
727     {0x3400, 0},
728     {0x9fa6, 0x6162},
729     {0xda9e, 0x3132},
730     {0xdada, 0},
731     {0xeeee, 0x87ff},
732     {0x11111,1},
733     {0x44444,0x6162},
734     {0xf0003,0},
735     {0xf0004,0xf},
736     {0xf0006,0x10},
737     {0xf0007,0x11},
738     {0xf0020,0x12},
739     {0x110000, 0}
740 };
741 
742 /* set some interesting overlapping ranges */
743 static const SetRange
744 setRanges2[]={
745     {0x21,   0x7f,       0x5555, TRUE},
746     {0x2f800,0x2fedc,    0x7a,   TRUE},
747     {0x72,   0xdd,       3,      TRUE},
748     {0xdd,   0xde,       4,      FALSE},
749     {0x201,  0x220,      6,      TRUE},  /* 3 consecutive blocks with the same pattern but discontiguous value ranges */
750     {0x221,  0x240,      6,      TRUE},
751     {0x241,  0x260,      6,      TRUE},
752     {0x2f987,0x2fa98,    5,      TRUE},
753     {0x2f777,0x2f833,    0,      TRUE},
754     {0x2f900,0x2ffee,    1,      FALSE},
755     {0x2ffee,0x2ffef,    2,      TRUE}
756 };
757 
758 static const CheckRange
759 checkRanges2[]={
760     {0,      0},      /* dummy start range to make _testEnumRange() simpler */
761     {0x21,   0},
762     {0x72,   0x5555},
763     {0xdd,   3},
764     {0xde,   4},
765     {0x201,  0},
766     {0x220,  6},
767     {0x221,  0},
768     {0x240,  6},
769     {0x241,  0},
770     {0x260,  6},
771     {0x2f833,0},
772     {0x2f987,0x7a},
773     {0x2fa98,5},
774     {0x2fedc,0x7a},
775     {0x2ffee,1},
776     {0x2ffef,2},
777     {0x110000, 0}
778 };
779 
780 /* use a non-zero initial value */
781 static const SetRange
782 setRanges3[]={
783     {0x31,   0xa4,   1,  FALSE},
784     {0x3400, 0x6789, 2,  FALSE},
785     {0x30000,0x34567,9,  TRUE},
786     {0x45678,0x56789,3,  TRUE}
787 };
788 
789 static const CheckRange
790 checkRanges3[]={
791     {0,      9},      /* dummy start range, also carries the initial value */
792     {0x31,   9},
793     {0xa4,   1},
794     {0x3400, 9},
795     {0x6789, 2},
796     {0x45678,9},
797     {0x56789,3},
798     {0x110000,9}
799 };
800 
801 static void
TrieTest(void)802 TrieTest(void) {
803     testTrieRanges4("set1",
804         setRanges1, UPRV_LENGTHOF(setRanges1),
805         checkRanges1, UPRV_LENGTHOF(checkRanges1));
806     testTrieRanges4("set2-overlap",
807         setRanges2, UPRV_LENGTHOF(setRanges2),
808         checkRanges2, UPRV_LENGTHOF(checkRanges2));
809     testTrieRanges4("set3-initial-9",
810         setRanges3, UPRV_LENGTHOF(setRanges3),
811         checkRanges3, UPRV_LENGTHOF(checkRanges3));
812 }
813 
814 /* test utrie_unserializeDummy() -------------------------------------------- */
815 
816 static int32_t U_CALLCONV
dummyGetFoldingOffset(uint32_t data)817 dummyGetFoldingOffset(uint32_t data) {
818     return -1; /* never get non-initialValue data for supplementary code points */
819 }
820 
821 static void
dummyTest(UBool make16BitTrie)822 dummyTest(UBool make16BitTrie) {
823     int32_t mem[UTRIE_DUMMY_SIZE/4];
824 
825     UTrie trie;
826     UErrorCode errorCode;
827     UChar32 c;
828 
829     uint32_t value, initialValue, leadUnitValue;
830 
831     if(make16BitTrie) {
832         initialValue=0x313;
833         leadUnitValue=0xaffe;
834     } else {
835         initialValue=0x01234567;
836         leadUnitValue=0x89abcdef;
837     }
838 
839     errorCode=U_ZERO_ERROR;
840     utrie_unserializeDummy(&trie, mem, sizeof(mem), initialValue, leadUnitValue, make16BitTrie, &errorCode);
841     if(U_FAILURE(errorCode)) {
842         log_err("utrie_unserializeDummy(make16BitTrie=%d) failed - %s\n", make16BitTrie, u_errorName(errorCode));
843         return;
844     }
845     trie.getFoldingOffset=dummyGetFoldingOffset;
846 
847     /* test that all code points have initialValue */
848     for(c=0; c<=0x10ffff; ++c) {
849         if(make16BitTrie) {
850             UTRIE_GET16(&trie, c, value);
851         } else {
852             UTRIE_GET32(&trie, c, value);
853         }
854         if(value!=initialValue) {
855             log_err("UTRIE_GET%s(dummy, U+%04lx)=0x%lx instead of 0x%lx\n",
856                 make16BitTrie ? "16" : "32", (long)c, (long)value, (long)initialValue);
857         }
858     }
859 
860     /* test that the lead surrogate code units have leadUnitValue */
861     for(c=0xd800; c<=0xdbff; ++c) {
862         if(make16BitTrie) {
863             value=UTRIE_GET16_FROM_LEAD(&trie, c);
864         } else {
865             value=UTRIE_GET32_FROM_LEAD(&trie, c);
866         }
867         if(value!=leadUnitValue) {
868             log_err("UTRIE_GET%s_FROM_LEAD(dummy, U+%04lx)=0x%lx instead of 0x%lx\n",
869                 make16BitTrie ? "16" : "32", (long)c, (long)value, (long)leadUnitValue);
870         }
871     }
872 }
873 
874 static void
DummyTrieTest(void)875 DummyTrieTest(void) {
876     dummyTest(TRUE);
877     dummyTest(FALSE);
878 }
879 
880 void
881 addTrieTest(TestNode** root);
882 
883 void
addTrieTest(TestNode ** root)884 addTrieTest(TestNode** root) {
885     addTest(root, &TrieTest, "tsutil/trietest/TrieTest");
886     addTest(root, &DummyTrieTest, "tsutil/trietest/DummyTrieTest");
887 }
888