1 /********************************************************************
2  * COPYRIGHT:
3  * Copyright (c) 1997-2014, International Business Machines Corporation and
4  * others. All Rights Reserved.
5  ********************************************************************/
6 /*******************************************************************************
7 *
8 * File CALLCOLL.C
9 *
10 * Modification History:
11 *        Name                     Description
12 *     Madhu Katragadda              Ported for C API
13 ********************************************************************************
14 */
15 
16 /*
17  * Important: This file is included into intltest/allcoll.cpp so that the
18  * test data is shared. This makes it easier to maintain the test data,
19  * especially since the Unicode data must be portable and quoted character
20  * literals will not work.
21  * If it is included, then there will be a #define INCLUDE_CALLCOLL_C
22  * that must prevent the actual code in here from being part of the
23  * allcoll.cpp compilation.
24  */
25 
/**
 * CollationDummyTest is a third level test class.  This tests creation of
 * a customized collator object.  For example, number 1 to be sorted
 * equivalent to word 'one'.
 */
31 
32 #include <string.h>
33 #include <stdlib.h>
34 
35 #include "unicode/utypes.h"
36 
37 #if !UCONFIG_NO_COLLATION
38 
39 #include "unicode/ucol.h"
40 #include "unicode/uloc.h"
41 #include "unicode/ures.h"
42 #include "unicode/udata.h"
43 #include "unicode/ucoleitr.h"
44 #include "unicode/ustring.h"
45 #include "unicode/uclean.h"
46 #include "unicode/putil.h"
47 #include "unicode/uenum.h"
48 
49 #include "cintltst.h"
50 #include "ccolltst.h"
51 #include "callcoll.h"
52 #include "calldata.h"
53 #include "cstring.h"
54 #include "cmemory.h"
55 
56 /* set to 1 to test offsets in backAndForth() */
57 #define TEST_OFFSETS 0
58 
59 /* perform test with strength PRIMARY */
60 static void TestPrimary(void);
61 
62 /* perform test with strength SECONDARY */
63 static void TestSecondary(void);
64 
65 /* perform test with strength tertiary */
66 static void TestTertiary(void);
67 
68 /*perform tests with strength Identical */
69 static void TestIdentical(void);
70 
71 /* perform extra tests */
72 static void TestExtra(void);
73 
74 /* Test jitterbug 581 */
75 static void TestJB581(void);
76 
77 /* Test jitterbug 1401 */
78 static void TestJB1401(void);
79 
80 /* Test [variable top] in the rule syntax */
81 static void TestVariableTop(void);
82 
83 /* Test surrogates */
84 static void TestSurrogates(void);
85 
86 static void TestInvalidRules(void);
87 
88 static void TestJitterbug1098(void);
89 
90 static void TestFCDCrash(void);
91 
92 static void TestJ5298(void);
93 
/*
 * Expected comparison results, used in parallel with testSourceCases[] and
 * testTargetCases[] (same index in all three arrays).
 * The numbers in the trailing comments are 1-based entry counts.
 * Index ranges consumed by the tests in this file:
 *   TestTertiary   indices  0..16
 *   TestPrimary    indices 17..25
 *   TestSecondary  indices 26..33
 *   TestIdentical  indices 34..36
 */
const UCollationResult results[] = {
    UCOL_LESS,
    UCOL_LESS, /*UCOL_GREATER,*/
    UCOL_LESS,
    UCOL_LESS,
    UCOL_LESS,
    UCOL_LESS,
    UCOL_LESS,
    UCOL_GREATER,
    UCOL_GREATER,
    UCOL_LESS,                                     /*  10 */
    UCOL_GREATER,
    UCOL_LESS,
    UCOL_GREATER,
    UCOL_GREATER,
    UCOL_LESS,
    UCOL_LESS,
    UCOL_LESS,
    /*  test primary > 17 (entries 18..26) */
    UCOL_EQUAL,
    UCOL_EQUAL,
    UCOL_EQUAL,                                    /*  20 */
    UCOL_LESS,
    UCOL_LESS,
    UCOL_EQUAL,
    UCOL_EQUAL,
    UCOL_EQUAL,
    UCOL_LESS,
    /*  test secondary > 26 (entries 27..34) */
    UCOL_EQUAL,
    UCOL_EQUAL,
    UCOL_EQUAL,
    UCOL_EQUAL,
    UCOL_EQUAL,                                    /*  31 */
    UCOL_EQUAL,
    UCOL_LESS,
    UCOL_EQUAL,                                     /*  34 */
    /*  test identical > 34 (entries 35..37) */
    UCOL_EQUAL,
    UCOL_EQUAL,
    UCOL_LESS                                        /* 37 */
};
135 
136 
/*
 * Appends two characters for val (high nibble first, then low nibble, each
 * converted with T_CString_itosOffset) to the NUL-terminated string dst and
 * re-terminates it. dst must have room for three more bytes.
 */
static void uprv_appendByteToHexString(char *dst, uint8_t val) {
  /* tail points at the current terminating NUL of dst */
  char *tail = dst + (uint32_t)uprv_strlen(dst);

  tail[0] = T_CString_itosOffset((val >> 4));
  tail[1] = T_CString_itosOffset((val & 0xF));
  tail[2] = 0;
}
144 
/*
 * this function makes a string with representation of a sortkey
 *
 * The text is written into buffer as "[" <level bytes> " . " <level bytes> ... "]",
 * each sort key byte being appended through uprv_appendByteToHexString()
 * followed by a space. A level ends at a 0x01 or 0x00 byte.
 *
 * coll     collator whose strength / case level / alternate handling
 *          attributes decide how many levels are printed
 * sortkey  zero-terminated sort key bytes
 * buffer   destination; written with strcpy/strcat and no size limit
 * len      only dereferenced in the final res_size check (see note below)
 *
 * Returns buffer.
 *
 * NOTE(review): res_size is initialized to 0 and never updated, so the
 * "res_size > *len" test can never be true and NULL is never returned.
 * NOTE(review): nothing bounds the writes into buffer; the caller has to
 * supply a buffer large enough for the whole key.
 * NOTE(review): errorCode is passed to ucol_getAttribute() but never checked.
 */
static char* U_EXPORT2 sortKeyToString(const UCollator *coll, const uint8_t *sortkey, char *buffer, uint32_t *len) {
    int32_t strength = UCOL_PRIMARY;
    uint32_t res_size = 0;
    UBool doneCase = FALSE;
    UErrorCode errorCode = U_ZERO_ERROR;

    char *current = buffer;
    const uint8_t *currentSk = sortkey;

    uprv_strcpy(current, "[");

    /* one pass per printed level, up to the collator strength (at most quaternary) */
    while(strength <= UCOL_QUATERNARY && strength <= ucol_getStrength(coll)) {
        if(strength > UCOL_PRIMARY) {
            uprv_strcat(current, " . ");
        }
        while(*currentSk != 0x01 && *currentSk != 0x00) { /* print a level */
            uprv_appendByteToHexString(current, *currentSk++);
            uprv_strcat(current, " ");
        }
        /*
         * With the case level attribute on, the first pass that reaches
         * SECONDARY only sets doneCase and does not advance strength, so one
         * extra level is printed before strength moves on.
         */
        if(ucol_getAttribute(coll, UCOL_CASE_LEVEL, &errorCode) == UCOL_ON && strength == UCOL_SECONDARY && doneCase == FALSE) {
            doneCase = TRUE;
        } else if(ucol_getAttribute(coll, UCOL_CASE_LEVEL, &errorCode) == UCOL_OFF || doneCase == TRUE || strength != UCOL_SECONDARY) {
            strength ++;
        }
        /* consume the byte that ended the level unless it is the final 0x00 */
        if (*currentSk) {
            uprv_appendByteToHexString(current, *currentSk++); /* This should print '01' */
        }
        /* stop before the quaternary level when alternate handling is non-ignorable */
        if(strength == UCOL_QUATERNARY && ucol_getAttribute(coll, UCOL_ALTERNATE_HANDLING, &errorCode) == UCOL_NON_IGNORABLE) {
            break;
        }
    }

    /* identical strength: print the remaining bytes up to and including the terminating 0x00 */
    if(ucol_getStrength(coll) == UCOL_IDENTICAL) {
        uprv_strcat(current, " . ");
        while(*currentSk != 0) {
            uprv_appendByteToHexString(current, *currentSk++);
            uprv_strcat(current, " ");
        }

        uprv_appendByteToHexString(current, *currentSk++);
    }
    uprv_strcat(current, "]");

    /* never true as written: res_size stays 0 (see note in the header comment) */
    if(res_size > *len) {
        return NULL;
    }

    return buffer;
}
195 
/*
 * Registers every test of this file under "tscoll/callcoll/" in the test
 * tree rooted at *root. Entries are registered in table order.
 */
void addAllCollTest(TestNode** root)
{
    static const struct {
        void (*test)(void);
        const char *path;
    } registry[] = {
        { &TestPrimary,       "tscoll/callcoll/TestPrimary" },
        { &TestSecondary,     "tscoll/callcoll/TestSecondary" },
        { &TestTertiary,      "tscoll/callcoll/TestTertiary" },
        { &TestIdentical,     "tscoll/callcoll/TestIdentical" },
        { &TestExtra,         "tscoll/callcoll/TestExtra" },
        { &TestJB581,         "tscoll/callcoll/TestJB581" },
        { &TestVariableTop,   "tscoll/callcoll/TestVariableTop" },
        { &TestSurrogates,    "tscoll/callcoll/TestSurrogates" },
        { &TestInvalidRules,  "tscoll/callcoll/TestInvalidRules" },
        { &TestJB1401,        "tscoll/callcoll/TestJB1401" },
        { &TestJitterbug1098, "tscoll/callcoll/TestJitterbug1098" },
        { &TestFCDCrash,      "tscoll/callcoll/TestFCDCrash" },
        { &TestJ5298,         "tscoll/callcoll/TestJ5298" }
    };
    const int32_t count = (int32_t)(sizeof(registry) / sizeof(registry[0]));
    int32_t k;

    for (k = 0; k < count; ++k) {
        addTest(root, registry[k].test, registry[k].path);
    }
}
212 
hasCollationElements(const char * locName)213 UBool hasCollationElements(const char *locName) {
214 
215   UErrorCode status = U_ZERO_ERROR;
216 
217   UResourceBundle *loc = ures_open(U_ICUDATA_NAME U_TREE_SEPARATOR_STRING "coll", locName, &status);;
218 
219   if(U_SUCCESS(status)) {
220     status = U_ZERO_ERROR;
221     loc = ures_getByKey(loc, "collations", loc, &status);
222     ures_close(loc);
223     if(status == U_ZERO_ERROR) { /* do the test - there are real elements */
224       return TRUE;
225     }
226   }
227   return FALSE;
228 }
229 
compareUsingPartials(UCollator * coll,const UChar source[],int32_t sLen,const UChar target[],int32_t tLen,int32_t pieceSize,UErrorCode * status)230 static UCollationResult compareUsingPartials(UCollator *coll, const UChar source[], int32_t sLen, const UChar target[], int32_t tLen, int32_t pieceSize, UErrorCode *status) {
231   int32_t partialSKResult = 0;
232   UCharIterator sIter, tIter;
233   uint32_t sState[2], tState[2];
234   int32_t sSize = pieceSize, tSize = pieceSize;
235   /*int32_t i = 0;*/
236   uint8_t sBuf[16384], tBuf[16384];
237   if(pieceSize > 16384) {
238     log_err("Partial sortkey size buffer too small. Please consider increasing the buffer!\n");
239     *status = U_BUFFER_OVERFLOW_ERROR;
240     return UCOL_EQUAL;
241   }
242   *status = U_ZERO_ERROR;
243   sState[0] = 0; sState[1] = 0;
244   tState[0] = 0; tState[1] = 0;
245   while(sSize == pieceSize && tSize == pieceSize && partialSKResult == 0) {
246     uiter_setString(&sIter, source, sLen);
247     uiter_setString(&tIter, target, tLen);
248     sSize = ucol_nextSortKeyPart(coll, &sIter, sState, sBuf, pieceSize, status);
249     tSize = ucol_nextSortKeyPart(coll, &tIter, tState, tBuf, pieceSize, status);
250 
251     if(sState[0] != 0 || tState[0] != 0) {
252       /*log_verbose("State != 0 : %08X %08X\n", sState[0], tState[0]);*/
253     }
254     /*log_verbose("%i ", i++);*/
255 
256     partialSKResult = memcmp(sBuf, tBuf, pieceSize);
257   }
258 
259   if(partialSKResult < 0) {
260       return UCOL_LESS;
261   } else if(partialSKResult > 0) {
262     return UCOL_GREATER;
263   } else {
264     return UCOL_EQUAL;
265   }
266 }
267 
/*
 * Compares source with target through every comparison path exercised by
 * this file and logs an error for each path whose outcome differs from the
 * expected result:
 *   - ucol_strcoll() with explicit lengths and with null terminated strings
 *   - ucol_strcollIter() over UTF-16
 *   - ucol_strcollUTF8() and ucol_strcollIter() over a UTF-8 conversion
 *     (skipped when a string does not fit the 256 byte conversion buffers)
 *   - partial sort keys via compareUsingPartials() (piece size 3 only in
 *     quick mode, all listed sizes otherwise)
 *   - full sort keys via ucol_getSortKey()
 * The final summary is delegated to reportCResult().
 *
 * myCollation  collator under test; its normalization mode is temporarily
 *              switched on in some steps and then restored
 * source       null terminated first string
 * target       null terminated second string
 * result       expected result of comparing source with target
 */
static void doTestVariant(UCollator* myCollation, const UChar source[], const UChar target[], UCollationResult result)
{
    int32_t sortklen1, sortklen2, sortklenmax;
    int temp=0, gSortklen1=0,gSortklen2=0;
    UCollationResult compareResult, compareResulta, keyResult, compareResultIter = result;
    uint8_t *sortKey1, *sortKey2, *sortKey1a, *sortKey2a;
    uint32_t sLen = u_strlen(source);
    uint32_t tLen = u_strlen(target);
    char buffer[256];
    /* sortKeyToString() reads *len, so it must not be left uninitialized */
    uint32_t len = (uint32_t)sizeof(buffer);
    UErrorCode status = U_ZERO_ERROR;
    UColAttributeValue norm = ucol_getAttribute(myCollation, UCOL_NORMALIZATION_MODE, &status);

    UCharIterator sIter, tIter;

    compareResult  = ucol_strcoll(myCollation, source, sLen, target, tLen);
    if (compareResult != result) {
        log_err("ucol_strcoll with explicit length returned wrong result (%i exp. %i): %s, %s\n",
            compareResult, result, aescstrdup(source,-1), aescstrdup(target,-1));
    }
    compareResulta = ucol_strcoll(myCollation, source, -1,   target, -1);
    if (compareResulta != result) {
        /* report the value that was actually checked (compareResulta) */
        log_err("ucol_strcoll with null terminated strings returned wrong result (%i exp. %i): %s, %s\n",
            compareResulta, result, aescstrdup(source,-1), aescstrdup(target,-1));
    }

    uiter_setString(&sIter, source, sLen);
    uiter_setString(&tIter, target, tLen);
    compareResultIter = ucol_strcollIter(myCollation, &sIter, &tIter, &status);
    if(compareResultIter != result) {
        log_err("different results in iterative comparison for UTF-16 encoded strings. %s, %s\n", aescstrdup(source,-1), aescstrdup(target,-1));
    }

    /* convert the strings to UTF-8 and do try comparing with char iterator and ucol_strcollUTF8 */
    {
        char utf8Source[256], utf8Target[256];
        int32_t utf8SourceLen = 0, utf8TargetLen = 0;

        u_strToUTF8(utf8Source, 256, &utf8SourceLen, source, sLen, &status);
        if(U_FAILURE(status)) { /* probably buffer is not big enough */
            log_verbose("Src UTF-8 buffer too small! Will not compare!\n");
        } else {
            u_strToUTF8(utf8Target, 256, &utf8TargetLen, target, tLen, &status);
            if(U_SUCCESS(status)) {
                {
                    /* ucol_strcollUTF8 */
                    compareResulta = ucol_strcollUTF8(myCollation, utf8Source, utf8SourceLen, utf8Target, utf8TargetLen, &status);
                    if (U_FAILURE(status)) {
                        log_err("Error in ucol_strcollUTF8 with explicit length\n");
                        status = U_ZERO_ERROR;
                    } else if (compareResulta != result) {
                        log_err("ucol_strcollUTF8 with explicit length returned wrong result (%i exp. %i): %s, %s\n",
                            compareResulta, result, aescstrdup(source,-1), aescstrdup(target,-1));
                    }
                    compareResulta = ucol_strcollUTF8(myCollation, utf8Source, -1, utf8Target, -1, &status);
                    if (U_FAILURE(status)) {
                        log_err("Error in ucol_strcollUTF8 with null terminated strings\n");
                        status = U_ZERO_ERROR;
                    } else if (compareResulta != result) {
                        log_err("ucol_strcollUTF8 with null terminated strings returned wrong result (%i exp. %i): %s, %s\n",
                            compareResulta, result, aescstrdup(source,-1), aescstrdup(target,-1));
                    }
                }

                {
                    /* char iterator over UTF8 */
                    UCollationResult compareResultUTF8Iter = result, compareResultUTF8IterNorm = result;

                    uiter_setUTF8(&sIter, utf8Source, utf8SourceLen);
                    uiter_setUTF8(&tIter, utf8Target, utf8TargetLen);
                    compareResultUTF8Iter = ucol_strcollIter(myCollation, &sIter, &tIter, &status);

                    /* repeat with normalization forced on, rewinding both iterators first */
                    ucol_setAttribute(myCollation, UCOL_NORMALIZATION_MODE, UCOL_ON, &status);
                    sIter.move(&sIter, 0, UITER_START);
                    tIter.move(&tIter, 0, UITER_START);
                    compareResultUTF8IterNorm = ucol_strcollIter(myCollation, &sIter, &tIter, &status);

                    /* restore the normalization mode the collator had on entry */
                    ucol_setAttribute(myCollation, UCOL_NORMALIZATION_MODE, norm, &status);
                    if(compareResultUTF8Iter != compareResultIter) {
                        log_err("different results in iterative comparison for UTF-16 and UTF-8 encoded strings. %s, %s\n", aescstrdup(source,-1), aescstrdup(target,-1));
                    }
                    if(compareResultUTF8Iter != compareResultUTF8IterNorm) {
                        log_err("different results in iterative when normalization is turned on with UTF-8 strings. %s, %s\n", aescstrdup(source,-1), aescstrdup(target,-1));
                    }
                }
            } else {
                log_verbose("Target UTF-8 buffer too small! Did not compare!\n");
            }
            if(U_FAILURE(status)) {
                log_verbose("UTF-8 strcoll failed! Ignoring result\n");
            }
        }
    }

    /* testing the partial sortkeys */
    if(1) { /*!QUICK*/
      int32_t i = 0;
      int32_t partialSizes[] = { 3, 1, 2, 4, 8, 20, 80 }; /* just size 3 in the quick mode */
      int32_t partialSizesSize = 1;
      if(getTestOption(QUICK_OPTION) <= 0) {
        partialSizesSize = 7;
      }
      /*log_verbose("partial sortkey test piecesize=");*/
      for(i = 0; i < partialSizesSize; i++) {
        UCollationResult partialSKResult = result, partialNormalizedSKResult = result;
        /*log_verbose("%i ", partialSizes[i]);*/

        partialSKResult = compareUsingPartials(myCollation, source, sLen, target, tLen, partialSizes[i], &status);
        if(partialSKResult != result) {
          log_err("Partial sortkey comparison returned wrong result (%i exp. %i): %s, %s (size %i)\n",
            partialSKResult, result,
            aescstrdup(source,-1), aescstrdup(target,-1), partialSizes[i]);
        }

        if(getTestOption(QUICK_OPTION) <= 0 && norm != UCOL_ON) {
          /*log_verbose("N ");*/
          ucol_setAttribute(myCollation, UCOL_NORMALIZATION_MODE, UCOL_ON, &status);
          partialNormalizedSKResult = compareUsingPartials(myCollation, source, sLen, target, tLen, partialSizes[i], &status);
          ucol_setAttribute(myCollation, UCOL_NORMALIZATION_MODE, norm, &status);
          if(partialSKResult != partialNormalizedSKResult) {
            log_err("Partial sortkey comparison gets different result when normalization is on: %s, %s (size %i)\n",
              aescstrdup(source,-1), aescstrdup(target,-1), partialSizes[i]);
          }
        }
      }
      /*log_verbose("\n");*/
    }

    /* first ask for the required sort key sizes (NULL buffer, capacity 0) */
    sortklen1=ucol_getSortKey(myCollation, source, sLen,  NULL, 0);
    sortklen2=ucol_getSortKey(myCollation, target, tLen,  NULL, 0);

    sortklenmax = (sortklen1>sortklen2?sortklen1:sortklen2);

    sortKey1 =(uint8_t*)malloc(sizeof(uint8_t) * (sortklenmax+1));
    sortKey1a=(uint8_t*)malloc(sizeof(uint8_t) * (sortklenmax+1));
    sortKey2 =(uint8_t*)malloc(sizeof(uint8_t) * (sortklenmax+1));
    sortKey2a=(uint8_t*)malloc(sizeof(uint8_t) * (sortklenmax+1));
    if(sortKey1 == NULL || sortKey1a == NULL || sortKey2 == NULL || sortKey2a == NULL) {
        log_err("Unable to allocate memory for sort keys\n");
        free(sortKey1);
        free(sortKey1a);
        free(sortKey2);
        free(sortKey2a);
        return;
    }

    ucol_getSortKey(myCollation, source, sLen, sortKey1,  sortklen1+1);
    ucol_getSortKey(myCollation, source, -1,   sortKey1a, sortklen1+1);

    ucol_getSortKey(myCollation, target, tLen, sortKey2,  sortklen2+1);
    ucol_getSortKey(myCollation, target, -1,   sortKey2a, sortklen2+1);

    /* Check that sort key generated with null terminated string is identical  */
    /*  to that generated with a length specified.                             */
    if (uprv_strcmp((const char *)sortKey1, (const char *)sortKey1a) != 0 ||
        uprv_strcmp((const char *)sortKey2, (const char *)sortKey2a) != 0 ) {
        log_err("Sort Keys from null terminated and explicit length strings differ.\n");
    }

    /*memcmp(sortKey1, sortKey2,sortklenmax);*/
    temp= uprv_strcmp((const char *)sortKey1, (const char *)sortKey2);
    /* the reported length must match the actual key length including its terminator */
    gSortklen1 = (int)uprv_strlen((const char *)sortKey1)+1;
    gSortklen2 = (int)uprv_strlen((const char *)sortKey2)+1;
    if(sortklen1 != gSortklen1){
        log_err("SortKey length does not match Expected: %i Got: %i\n",sortklen1, gSortklen1);
        log_verbose("Generated sortkey: %s\n", sortKeyToString(myCollation, sortKey1, buffer, &len));
    }
    if(sortklen2!= gSortklen2){
        log_err("SortKey length does not match Expected: %i Got: %i\n", sortklen2, gSortklen2);
        log_verbose("Generated sortkey: %s\n", sortKeyToString(myCollation, sortKey2, buffer, &len));
    }

    if(temp < 0) {
        keyResult=UCOL_LESS;
    }
    else if(temp > 0) {
        keyResult= UCOL_GREATER;
    }
    else {
        keyResult = UCOL_EQUAL;
    }
    reportCResult( source, target, sortKey1, sortKey2, compareResult, keyResult, compareResultIter, result );
    free(sortKey1);
    free(sortKey2);
    free(sortKey1a);
    free(sortKey2a);

}
449 
/*
 * Runs doTestVariant() on (source, target) with the expected result, and then
 * on (target, source) with the mirrored expectation (LESS <-> GREATER, any
 * other value is checked as EQUAL).
 * Logs a data error and does nothing else when myCollation is NULL.
 */
void doTest(UCollator* myCollation, const UChar source[], const UChar target[], UCollationResult result)
{
  UCollationResult mirrored;

  if(!myCollation) {
    log_data_err("No collator! Any data around?\n");
    return;
  }

  if(result == UCOL_LESS) {
    mirrored = UCOL_GREATER;
  } else if(result == UCOL_GREATER) {
    mirrored = UCOL_LESS;
  } else {
    mirrored = UCOL_EQUAL;
  }

  doTestVariant(myCollation, source, target, result);
  doTestVariant(myCollation, target, source, mirrored);
}
465 
466 
467 /**
468  * Return an integer array containing all of the collation orders
469  * returned by calls to next on the specified iterator
470  */
getOrders(UCollationElements * iter,int32_t * orderLength)471 OrderAndOffset* getOrders(UCollationElements *iter, int32_t *orderLength)
472 {
473     UErrorCode status;
474     int32_t order;
475     int32_t maxSize = 100;
476     int32_t size = 0;
477     int32_t offset = ucol_getOffset(iter);
478     OrderAndOffset *temp;
479     OrderAndOffset *orders =(OrderAndOffset *)malloc(sizeof(OrderAndOffset) * maxSize);
480     status= U_ZERO_ERROR;
481 
482 
483     while ((order=ucol_next(iter, &status)) != UCOL_NULLORDER)
484     {
485         if (size == maxSize)
486         {
487             maxSize *= 2;
488             temp = (OrderAndOffset *)malloc(sizeof(OrderAndOffset) * maxSize);
489 
490             memcpy(temp, orders, size * sizeof(OrderAndOffset));
491             free(orders);
492             orders = temp;
493 
494         }
495 
496         orders[size].order  = order;
497         orders[size].offset = offset;
498 
499         offset = ucol_getOffset(iter);
500         size += 1;
501     }
502 
503     if (maxSize > size && size > 0)
504     {
505         temp = (OrderAndOffset *)malloc(sizeof(OrderAndOffset) * size);
506 
507         memcpy(temp, orders, size * sizeof(OrderAndOffset));
508         free(orders);
509         orders = temp;
510 
511 
512     }
513 
514     *orderLength = size;
515     return orders;
516 }
517 
518 
519 void
backAndForth(UCollationElements * iter)520 backAndForth(UCollationElements *iter)
521 {
522     /* Run through the iterator forwards and stick it into an array */
523     int32_t idx, o;
524     UErrorCode status = U_ZERO_ERROR;
525     int32_t orderLength = 0;
526     OrderAndOffset *orders = getOrders(iter, &orderLength);
527 
528 
529     /* Now go through it backwards and make sure we get the same values */
530     idx = orderLength;
531     ucol_reset(iter);
532 
533     /* synwee : changed */
534     while ((o = ucol_previous(iter, &status)) != UCOL_NULLORDER) {
535 #if TEST_OFFSETS
536       int32_t offset =
537 #endif
538         ucol_getOffset(iter);
539 
540       idx -= 1;
541       if (o != orders[idx].order) {
542         if (o == 0)
543           idx ++;
544         else {
545           while (idx > 0 && orders[-- idx].order == 0) {
546             /* nothing... */
547           }
548 
549           if (o != orders[idx].order) {
550               log_err("Mismatched order at index %d: 0x%8.8X vs. 0x%8.8X\n", idx,
551                 orders[idx].order, o);
552             goto bail;
553           }
554         }
555       }
556 
557 #if TEST_OFFSETS
558       if (offset != orders[idx].offset) {
559         log_err("Mismatched offset at index %d: %d vs. %d\n", idx,
560             orders[idx].offset, offset);
561         goto bail;
562       }
563 #endif
564 
565     }
566 
567     while (idx != 0 && orders[idx - 1].order == 0) {
568       idx -= 1;
569     }
570 
571     if (idx != 0) {
572         log_err("Didn't get back to beginning - index is %d\n", idx);
573 
574         ucol_reset(iter);
575         log_err("\nnext: ");
576 
577         if ((o = ucol_next(iter, &status)) != UCOL_NULLORDER) {
578             log_err("Error at %x\n", o);
579         }
580 
581         log_err("\nprev: ");
582 
583         if ((o = ucol_previous(iter, &status)) != UCOL_NULLORDER) {
584             log_err("Error at %x\n", o);
585         }
586 
587         log_verbose("\n");
588     }
589 
590 bail:
591     free(orders);
592 }
593 
/*
 * Checks every ordered pair (s[i], s[j]) with i < j: both strings are
 * unescaped with u_unescape(), compared through doTest() expecting result,
 * and then each is run through backAndForth() on a collation element
 * iterator.
 *
 * coll    collator under test
 * s       array of size escaped strings
 * size    number of strings in s; 0 or 1 means there is nothing to compare
 * result  expected result for every pair
 *
 * If the element iterator cannot be created an error is logged and only the
 * doTest() comparisons are performed.
 */
void genericOrderingTestWithResult(UCollator *coll, const char * const s[], uint32_t size, UCollationResult result) {
  UChar t1[2048] = {0};
  UChar t2[2048] = {0};
  const int32_t capacity = (int32_t)(sizeof(t1) / sizeof(t1[0]));
  UCollationElements *iter;
  UErrorCode status = U_ZERO_ERROR;

  uint32_t i = 0, j = 0;
  log_verbose("testing sequence:\n");
  for(i = 0; i < size; i++) {
    log_verbose("%s\n", s[i]);
  }

  iter = ucol_openElements(coll, t1, u_strlen(t1), &status);
  if (U_FAILURE(status)) {
    log_err("Creation of iterator failed\n");
  }
  /* "i + 1 < size" instead of "i < size - 1": size is unsigned, so size - 1 wraps for size == 0 */
  for(i = 0; i + 1 < size; i++) {
    for(j = i+1; j < size; j++) {
      u_unescape(s[i], t1, capacity);
      u_unescape(s[j], t2, capacity);
      doTest(coll, t1, t2, result);
      /* synwee : added collation element iterator test */
      if(iter != NULL) {
        ucol_setText(iter, t1, u_strlen(t1), &status);
        backAndForth(iter);
        ucol_setText(iter, t2, u_strlen(t2), &status);
        backAndForth(iter);
      }
    }
  }
  if(iter != NULL) {
    ucol_closeElements(iter);
  }
}
624 
/*
 * Convenience wrapper: runs genericOrderingTestWithResult() on the size
 * strings in s, expecting UCOL_LESS for every pair.
 */
void genericOrderingTest(UCollator *coll, const char * const s[], uint32_t size) {
  genericOrderingTestWithResult(coll, s, size, UCOL_LESS);
}
628 
genericLocaleStarter(const char * locale,const char * const s[],uint32_t size)629 void genericLocaleStarter(const char *locale, const char * const s[], uint32_t size) {
630   UErrorCode status = U_ZERO_ERROR;
631   UCollator *coll = ucol_open(locale, &status);
632 
633   log_verbose("Locale starter for %s\n", locale);
634 
635   if(U_SUCCESS(status)) {
636     genericOrderingTest(coll, s, size);
637   } else if(status == U_FILE_ACCESS_ERROR) {
638     log_data_err("Is your data around?\n");
639     return;
640   } else {
641     log_err("Unable to open collator for locale %s\n", locale);
642   }
643   ucol_close(coll);
644 }
645 
/*
 * Opens a collator for locale and runs genericOrderingTestWithResult() on
 * the size strings in s, expecting result for every pair.
 * A U_FILE_ACCESS_ERROR from ucol_open() is reported as a data error and the
 * function returns immediately; any other failure is logged as an error.
 */
void genericLocaleStarterWithResult(const char *locale, const char * const s[], uint32_t size, UCollationResult result) {
  UErrorCode status = U_ZERO_ERROR;
  UCollator *coll = ucol_open(locale, &status);

  log_verbose("Locale starter for %s\n", locale);

  if(U_FAILURE(status)) {
    if(status == U_FILE_ACCESS_ERROR) {
      /* missing data: report and leave without touching the collator */
      log_data_err("Is your data around?\n");
      return;
    }
    log_err("Unable to open collator for locale %s\n", locale);
  } else {
    genericOrderingTestWithResult(coll, s, size, result);
  }
  ucol_close(coll);
}
662 
663 /* currently not used with options */
genericRulesStarterWithOptionsAndResult(const char * rules,const char * const s[],uint32_t size,const UColAttribute * attrs,const UColAttributeValue * values,uint32_t attsize,UCollationResult result)664 void genericRulesStarterWithOptionsAndResult(const char *rules, const char * const s[], uint32_t size, const UColAttribute *attrs, const UColAttributeValue *values, uint32_t attsize, UCollationResult result) {
665   UErrorCode status = U_ZERO_ERROR;
666   UChar rlz[RULE_BUFFER_LEN] = { 0 };
667   uint32_t rlen = u_unescape(rules, rlz, RULE_BUFFER_LEN);
668   uint32_t i;
669 
670   UCollator *coll = ucol_openRules(rlz, rlen, UCOL_DEFAULT, UCOL_DEFAULT,NULL, &status);
671 
672   log_verbose("Rules starter for %s\n", rules);
673 
674   if(U_SUCCESS(status)) {
675     log_verbose("Setting attributes\n");
676     for(i = 0; i < attsize; i++) {
677       ucol_setAttribute(coll, attrs[i], values[i], &status);
678     }
679 
680     genericOrderingTestWithResult(coll, s, size, result);
681   } else {
682     log_err_status(status, "Unable to open collator with rules %s\n", rules);
683   }
684   ucol_close(coll);
685 }
686 
/*
 * Opens a collator for locale, applies attsize attribute/value pairs
 * (attrs[k] set to values[k]) and runs genericOrderingTestWithResult() on
 * the size strings in s, expecting result for every pair.
 * If the collator cannot be opened the failure is logged with the status.
 */
void genericLocaleStarterWithOptionsAndResult(const char *locale, const char * const s[], uint32_t size, const UColAttribute *attrs, const UColAttributeValue *values, uint32_t attsize, UCollationResult result) {
  UErrorCode status = U_ZERO_ERROR;
  UCollator *coll = ucol_open(locale, &status);

  log_verbose("Locale starter for %s\n", locale);

  if(U_FAILURE(status)) {
    log_err_status(status, "Unable to open collator for locale %s\n", locale);
  } else {
    uint32_t k = 0;

    log_verbose("Setting attributes\n");
    while(k < attsize) {
      ucol_setAttribute(coll, attrs[k], values[k], &status);
      ++k;
    }

    genericOrderingTestWithResult(coll, s, size, result);
  }
  ucol_close(coll);
}
708 
/*
 * Convenience wrapper: forwards all arguments to
 * genericLocaleStarterWithOptionsAndResult(), expecting UCOL_LESS for
 * every pair.
 */
void genericLocaleStarterWithOptions(const char *locale, const char * const s[], uint32_t size, const UColAttribute *attrs, const UColAttributeValue *values, uint32_t attsize) {
  genericLocaleStarterWithOptionsAndResult(locale, s, size, attrs, values, attsize, UCOL_LESS);
}
712 
/*
 * Builds a collator from the escaped rule string rules and runs
 * genericOrderingTestWithResult() on the size strings in s, expecting
 * result for every pair. The collator is closed only when it was opened
 * successfully.
 * A U_FILE_ACCESS_ERROR is reported as a data error; any other failure is
 * logged as an error.
 */
void genericRulesStarterWithResult(const char *rules, const char * const s[], uint32_t size, UCollationResult result) {
  UErrorCode status = U_ZERO_ERROR;
  UChar rlz[RULE_BUFFER_LEN] = { 0 };
  uint32_t rlen = u_unescape(rules, rlz, RULE_BUFFER_LEN);
  UCollator *coll = ucol_openRules(rlz, rlen, UCOL_DEFAULT, UCOL_DEFAULT,NULL, &status);

  log_verbose("Rules starter for %s\n", rules);

  if(status == U_FILE_ACCESS_ERROR) {
    log_data_err("Is your data around?\n");
    return;
  }
  if(U_FAILURE(status)) {
    log_err("Unable to open collator with rules %s\n", rules);
    return;
  }

  genericOrderingTestWithResult(coll, s, size, result);
  ucol_close(coll);
}
731 
/*
 * Convenience wrapper: runs genericRulesStarterWithResult() with the given
 * rules and strings, expecting UCOL_LESS for every pair.
 */
void genericRulesStarter(const char *rules, const char * const s[], uint32_t size) {
  genericRulesStarterWithResult(rules, s, size, UCOL_LESS);
}
735 
TestTertiary()736 static void TestTertiary()
737 {
738     int32_t len,i;
739     UCollator *myCollation;
740     UErrorCode status=U_ZERO_ERROR;
741     static const char str[]="& C < ch, cH, Ch, CH & Five, 5 & Four, 4 & one, 1 & Ampersand; '&' & Two, 2 ";
742     UChar rules[sizeof(str)];
743     len = strlen(str);
744     u_uastrcpy(rules, str);
745 
746     myCollation=ucol_openRules(rules, len, UCOL_OFF, UCOL_DEFAULT_STRENGTH, NULL, &status);
747     if(U_FAILURE(status)){
748         log_err_status(status, "ERROR: in creation of rule based collator :%s\n", myErrorName(status));
749         return;
750     }
751 
752     ucol_setStrength(myCollation, UCOL_TERTIARY);
753     for (i = 0; i < 17 ; i++)
754     {
755         doTest(myCollation, testSourceCases[i], testTargetCases[i], results[i]);
756     }
757     ucol_close(myCollation);
758     myCollation = 0;
759 }
760 
TestPrimary()761 static void TestPrimary( )
762 {
763     int32_t len,i;
764     UCollator *myCollation;
765     UErrorCode status=U_ZERO_ERROR;
766     static const char str[]="& C < ch, cH, Ch, CH & Five, 5 & Four, 4 & one, 1 & Ampersand; '&' & Two, 2 ";
767     UChar rules[sizeof(str)];
768     len = strlen(str);
769     u_uastrcpy(rules, str);
770 
771     myCollation=ucol_openRules(rules, len, UCOL_OFF, UCOL_DEFAULT_STRENGTH,NULL, &status);
772     if(U_FAILURE(status)){
773         log_err_status(status, "ERROR: in creation of rule based collator :%s\n", myErrorName(status));
774         return;
775     }
776     ucol_setStrength(myCollation, UCOL_PRIMARY);
777 
778     for (i = 17; i < 26 ; i++)
779     {
780 
781         doTest(myCollation, testSourceCases[i], testTargetCases[i], results[i]);
782     }
783     ucol_close(myCollation);
784     myCollation = 0;
785 }
786 
TestSecondary()787 static void TestSecondary()
788 {
789     int32_t i;
790     int32_t len;
791     UCollator *myCollation;
792     UErrorCode status=U_ZERO_ERROR;
793     static const char str[]="& C < ch, cH, Ch, CH & Five, 5 & Four, 4 & one, 1 & Ampersand; '&' & Two, 2 ";
794     UChar rules[sizeof(str)];
795     len = strlen(str);
796     u_uastrcpy(rules, str);
797 
798     myCollation=ucol_openRules(rules, len, UCOL_OFF, UCOL_DEFAULT_STRENGTH,NULL, &status);
799     if(U_FAILURE(status)){
800         log_err_status(status, "ERROR: in creation of rule based collator :%s\n", myErrorName(status));
801         return;
802     }
803     ucol_setStrength(myCollation, UCOL_SECONDARY);
804     for (i = 26; i < 34 ; i++)
805     {
806         doTest(myCollation, testSourceCases[i], testTargetCases[i], results[i]);
807     }
808     ucol_close(myCollation);
809     myCollation = 0;
810 }
811 
TestIdentical()812 static void TestIdentical()
813 {
814     int32_t i;
815     int32_t len;
816     UCollator *myCollation;
817     UErrorCode status=U_ZERO_ERROR;
818     static const char str[]="& C < ch, cH, Ch, CH & Five, 5 & Four, 4 & one, 1 & Ampersand; '&' & Two, 2 ";
819     UChar rules[sizeof(str)];
820     len = strlen(str);
821     u_uastrcpy(rules, str);
822 
823     myCollation=ucol_openRules(rules, len, UCOL_OFF, UCOL_IDENTICAL, NULL,&status);
824     if(U_FAILURE(status)){
825         log_err_status(status, "ERROR: in creation of rule based collator :%s\n", myErrorName(status));
826         return;
827     }
828     for(i= 34; i<37; i++)
829     {
830         doTest(myCollation, testSourceCases[i], testTargetCases[i], results[i]);
831     }
832     ucol_close(myCollation);
833     myCollation = 0;
834 }
835 
TestExtra()836 static void TestExtra()
837 {
838     int32_t i, j;
839     int32_t len;
840     UCollator *myCollation;
841     UErrorCode status = U_ZERO_ERROR;
842     static const char str[]="& C < ch, cH, Ch, CH & Five, 5 & Four, 4 & one, 1 & Ampersand; '&' & Two, 2 ";
843     UChar rules[sizeof(str)];
844     len = strlen(str);
845     u_uastrcpy(rules, str);
846 
847     myCollation=ucol_openRules(rules, len, UCOL_OFF, UCOL_DEFAULT_STRENGTH,NULL, &status);
848     if(U_FAILURE(status)){
849         log_err_status(status, "ERROR: in creation of rule based collator :%s\n", myErrorName(status));
850         return;
851     }
852     ucol_setStrength(myCollation, UCOL_TERTIARY);
853     for (i = 0; i < COUNT_TEST_CASES-1 ; i++)
854     {
855         for (j = i + 1; j < COUNT_TEST_CASES; j += 1)
856         {
857 
858             doTest(myCollation, testCases[i], testCases[j], UCOL_LESS);
859         }
860     }
861     ucol_close(myCollation);
862     myCollation = 0;
863 }
864 
TestJB581(void)865 static void TestJB581(void)
866 {
867     int32_t     bufferLen   = 0;
868     UChar       source      [100];
869     UChar       target      [100];
870     UCollationResult result     = UCOL_EQUAL;
871     uint8_t     sourceKeyArray  [100];
872     uint8_t     targetKeyArray  [100];
873     int32_t     sourceKeyOut    = 0,
874                 targetKeyOut    = 0;
875     UCollator   *myCollator = 0;
876     UErrorCode status = U_ZERO_ERROR;
877 
878     /*u_uastrcpy(source, "This is a test.");*/
879     /*u_uastrcpy(target, "THISISATEST.");*/
880     u_uastrcpy(source, "THISISATEST.");
881     u_uastrcpy(target, "Thisisatest.");
882 
883     myCollator = ucol_open("en_US", &status);
884     if (U_FAILURE(status)){
885         log_err_status(status, "ERROR: Failed to create the collator : %s\n", u_errorName(status));
886         return;
887     }
888     result = ucol_strcoll(myCollator, source, -1, target, -1);
889     /* result is 1, secondary differences only for ignorable space characters*/
890     if (result != 1)
891     {
892         log_err("Comparing two strings with only secondary differences in C failed.\n");
893     }
894     /* To compare them with just primary differences */
895     ucol_setStrength(myCollator, UCOL_PRIMARY);
896     result = ucol_strcoll(myCollator, source, -1, target, -1);
897     /* result is 0 */
898     if (result != 0)
899     {
900         log_err("Comparing two strings with no differences in C failed.\n");
901     }
902     /* Now, do the same comparison with keys */
903     sourceKeyOut = ucol_getSortKey(myCollator, source, -1, sourceKeyArray, 100);
904     (void)sourceKeyOut;    /* Suppress set but not used warning. */
905     targetKeyOut = ucol_getSortKey(myCollator, target, -1, targetKeyArray, 100);
906     bufferLen = ((targetKeyOut > 100) ? 100 : targetKeyOut);
907     if (memcmp(sourceKeyArray, targetKeyArray, bufferLen) != 0)
908     {
909         log_err("Comparing two strings with sort keys in C failed.\n");
910     }
911     ucol_close(myCollator);
912 }
913 
TestJB1401(void)914 static void TestJB1401(void)
915 {
916     UCollator     *myCollator = 0;
917     UErrorCode     status = U_ZERO_ERROR;
918     static UChar   NFD_UnsafeStartChars[] = {
919         0x0f73,          /* Tibetan Vowel Sign II */
920         0x0f75,          /* Tibetan Vowel Sign UU */
921         0x0f81,          /* Tibetan Vowel Sign Reversed II */
922             0
923     };
924     int            i;
925 
926 
927     myCollator = ucol_open("en_US", &status);
928     if (U_FAILURE(status)){
929         log_err_status(status, "ERROR: Failed to create the collator : %s\n", u_errorName(status));
930         return;
931     }
932     ucol_setAttribute(myCollator, UCOL_NORMALIZATION_MODE, UCOL_ON, &status);
933     if (U_FAILURE(status)){
934         log_err("ERROR: Failed to set normalization mode ON for collator.\n");
935         return;
936     }
937 
938     for (i=0; ; i++) {
939         UChar    c;
940         UChar    X[4];
941         UChar    Y[20];
942         UChar    Z[20];
943 
944         /*  Get the next funny character to be tested, and set up the
945          *  three test strings X, Y, Z, consisting of an A-grave + test char,
946          *    in original form, NFD, and then NFC form.
947          */
948         c = NFD_UnsafeStartChars[i];
949         if (c==0) {break;}
950 
951         X[0]=0xC0; X[1]=c; X[2]=0;   /* \u00C0 is A Grave*/
952 
953         unorm_normalize(X, -1, UNORM_NFD, 0, Y, 20, &status);
954         unorm_normalize(Y, -1, UNORM_NFC, 0, Z, 20, &status);
955         if (U_FAILURE(status)){
956             log_err("ERROR: Failed to normalize test of character %x\n", c);
957             return;
958         }
959 
960         /* Collation test.  All three strings should be equal.
961          *   doTest does both strcoll and sort keys, with params in both orders.
962          */
963         doTest(myCollator, X, Y, UCOL_EQUAL);
964         doTest(myCollator, X, Z, UCOL_EQUAL);
965         doTest(myCollator, Y, Z, UCOL_EQUAL);
966 
967         /* Run collation element iterators over the three strings.  Results should be same for each.
968          */
969         {
970             UCollationElements *ceiX, *ceiY, *ceiZ;
971             int32_t             ceX,   ceY,   ceZ;
972             int                 j;
973 
974             ceiX = ucol_openElements(myCollator, X, -1, &status);
975             ceiY = ucol_openElements(myCollator, Y, -1, &status);
976             ceiZ = ucol_openElements(myCollator, Z, -1, &status);
977             if (U_FAILURE(status)) {
978                 log_err("ERROR: uucol_openElements failed.\n");
979                 return;
980             }
981 
982             for (j=0;; j++) {
983                 ceX = ucol_next(ceiX, &status);
984                 ceY = ucol_next(ceiY, &status);
985                 ceZ = ucol_next(ceiZ, &status);
986                 if (U_FAILURE(status)) {
987                     log_err("ERROR: ucol_next failed for iteration #%d.\n", j);
988                     break;
989                 }
990                 if (ceX != ceY || ceY != ceZ) {
991                     log_err("ERROR: ucol_next failed for iteration #%d.\n", j);
992                     break;
993                 }
994                 if (ceX == UCOL_NULLORDER) {
995                     break;
996                 }
997             }
998             ucol_closeElements(ceiX);
999             ucol_closeElements(ceiY);
1000             ucol_closeElements(ceiZ);
1001         }
1002     }
1003     ucol_close(myCollator);
1004 }
1005 
1006 
1007 
/**
* Formerly tested the [variable top] tag in rule syntax: with alternate
* handling set to shifted, code points before [variable top] were expected
* to produce all-zero sort key bytes.
*
* The whole body is compiled out with #if 0, so this function currently does
* nothing. Starting with ICU 53, setting the variable top via a pseudo
* relation string is not supported any more; it was replaced by the
* [maxVariable symbol] setting. See ICU tickets #9958 and #8032.
*/
static void TestVariableTop(void)
{
#if 0
    static const char ruleText[] = "&z = [variable top]";
    UChar       ruleBuf[sizeof(ruleText)];
    UCollator  *tailored;
    UCollator  *english;
    UErrorCode  errorCode = U_ZERO_ERROR;
    UChar       probe[1];
    UChar       letter;
    uint8_t     key[20];
    uint8_t     zeros[20];
    int         ruleLen = strlen(ruleText);
    int         keyLen;

    u_uastrcpy(ruleBuf, ruleText);

    english = ucol_open("en_US", &errorCode);
    if (U_FAILURE(errorCode)) {
        log_err_status(errorCode, "ERROR: in creation of collator :%s\n",
                myErrorName(errorCode));
        return;
    }

    tailored = ucol_openRules(ruleBuf, ruleLen, UCOL_OFF,
                              UCOL_PRIMARY, NULL, &errorCode);
    if (U_FAILURE(errorCode)) {
        ucol_close(english);
        log_err("ERROR: in creation of rule based collator :%s\n",
                myErrorName(errorCode));
        return;
    }

    ucol_setStrength(english, UCOL_PRIMARY);
    ucol_setAttribute(english, UCOL_ALTERNATE_HANDLING, UCOL_SHIFTED,
                      &errorCode);
    ucol_setAttribute(tailored, UCOL_ALTERNATE_HANDLING, UCOL_SHIFTED,
                      &errorCode);

    if (ucol_getAttribute(tailored, UCOL_ALTERNATE_HANDLING, &errorCode) !=
        UCOL_SHIFTED || U_FAILURE(errorCode)) {
        log_err("ERROR: ALTERNATE_HANDLING value can not be set to SHIFTED\n");
    }

    /* Reference key: all zero bytes. */
    uprv_memset(zeros, 0, 20);

    /* space is supposed to be a variable */
    probe[0] = ' ';
    keyLen = ucol_getSortKey(english, probe, 1, key, sizeof(key));
    if (uprv_memcmp(zeros, key, keyLen) != 0) {
        log_err("ERROR: SHIFTED alternate does not return 0 for primary of space\n");
    }

    /* Every letter below 'z' is checked against the tailored collator. */
    for (letter = 'a'; letter < 'z'; letter++) {
        probe[0] = letter;
        keyLen = ucol_getSortKey(tailored, probe, 1, key, sizeof(key));
        if (uprv_memcmp(zeros, key, keyLen) != 0) {
            log_err("ERROR: SHIFTED alternate does not return 0 for primary of %c\n",
                    letter);
        }
    }

    ucol_close(english);
    ucol_close(tailored);
#endif
}
1090 
1091 /**
1092   * Tests surrogate support.
1093   * NOTE: This test used \\uD801\\uDC01 pair, which is now assigned to Desseret
1094   * Therefore, another (unassigned) code point was used for this test.
1095   */
TestSurrogates(void)1096 static void TestSurrogates(void)
1097 {
1098     static const char       str[]          =
1099                               "&z<'\\uD800\\uDC00'<'\\uD800\\uDC0A\\u0308'<A";
1100           int         len          = strlen(str);
1101           int         rlen         = 0;
1102           UChar      rules[sizeof(str)];
1103           UCollator  *myCollation;
1104           UCollator  *enCollation;
1105           UErrorCode  status       = U_ZERO_ERROR;
1106           UChar       source[][4]    =
1107           {{'z', 0, 0}, {0xD800, 0xDC00, 0}, {0xD800, 0xDC0A, 0x0308, 0}, {0xD800, 0xDC02}};
1108           UChar       target[][4]    =
1109           {{0xD800, 0xDC00, 0}, {0xD800, 0xDC0A, 0x0308, 0}, {'A', 0, 0}, {0xD800, 0xDC03}};
1110           int         count        = 0;
1111           uint8_t enresult[20], myresult[20];
1112           int enlen, mylen;
1113 
1114     /* tests for open rules with surrogate rules */
1115     rlen = u_unescape(str, rules, len);
1116 
1117     enCollation = ucol_open("en_US", &status);
1118     if (U_FAILURE(status)) {
1119         log_err_status(status, "ERROR: in creation of collator :%s\n",
1120                 myErrorName(status));
1121         return;
1122     }
1123     myCollation = ucol_openRules(rules, rlen, UCOL_OFF,
1124                                  UCOL_TERTIARY,NULL, &status);
1125     if (U_FAILURE(status)) {
1126         ucol_close(enCollation);
1127         log_err("ERROR: in creation of rule based collator :%s\n",
1128                 myErrorName(status));
1129         return;
1130     }
1131 
1132     /*
1133     this test is to verify the supplementary sort key order in the english
1134     collator
1135     */
1136     log_verbose("start of english collation supplementary characters test\n");
1137     while (count < 2) {
1138         doTest(enCollation, source[count], target[count], UCOL_LESS);
1139         count ++;
1140     }
1141     doTest(enCollation, source[count], target[count], UCOL_GREATER);
1142 
1143     log_verbose("start of tailored collation supplementary characters test\n");
1144     count = 0;
1145     /* tests getting collation elements for surrogates for tailored rules */
1146     while (count < 4) {
1147         doTest(myCollation, source[count], target[count], UCOL_LESS);
1148         count ++;
1149     }
1150 
1151     /* tests that \uD800\uDC02 still has the same value, not changed */
1152     enlen = ucol_getSortKey(enCollation, source[3], 2, enresult, 20);
1153     mylen = ucol_getSortKey(myCollation, source[3], 2, myresult, 20);
1154     if (enlen != mylen ||
1155         uprv_memcmp(enresult, myresult, enlen) != 0) {
1156         log_verbose("Failed : non-tailored supplementary characters should have the same value\n");
1157     }
1158 
1159     ucol_close(enCollation);
1160     ucol_close(myCollation);
1161     enCollation = NULL;
1162     myCollation = NULL;
1163 }
1164 
1165 /*
1166  *### TODO: Add more invalid rules to test all different scenarios.
1167  *
1168  */
1169 static void
TestInvalidRules()1170 TestInvalidRules(){
1171 #define MAX_ERROR_STATES 2
1172 
1173     static const char* rulesArr[MAX_ERROR_STATES] = {
1174         "& C < ch, cH, Ch[this should fail]<d",
1175         "& C < ch, cH, & Ch[variable top]"
1176     };
1177     static const char* preContextArr[MAX_ERROR_STATES] = {
1178         " C < ch, cH, Ch",
1179         "& C < ch, cH",
1180 
1181     };
1182     static const char* postContextArr[MAX_ERROR_STATES] = {
1183         "[this should fa",
1184         ", & Ch[variable"
1185     };
1186     int i;
1187 
1188     for(i = 0;i<MAX_ERROR_STATES;i++){
1189         UChar rules[1000]       = { '\0' };
1190         UChar preContextExp[1000]  = { '\0' };
1191         UChar postContextExp[1000] = { '\0' };
1192         UParseError parseError;
1193         UErrorCode status = U_ZERO_ERROR;
1194         UCollator* coll=0;
1195         u_charsToUChars(rulesArr[i],rules,uprv_strlen(rulesArr[i])+1);
1196         u_charsToUChars(preContextArr[i],preContextExp,uprv_strlen(preContextArr[i])+1);
1197         u_charsToUChars(postContextArr[i],postContextExp,uprv_strlen(postContextArr[i])+1);
1198         /* clean up stuff in parseError */
1199         u_memset(parseError.preContext,0x0000,U_PARSE_CONTEXT_LEN);
1200         u_memset(parseError.postContext,0x0000,U_PARSE_CONTEXT_LEN);
1201         /* open the rules and test */
1202         coll = ucol_openRules(rules,u_strlen(rules),UCOL_OFF,UCOL_DEFAULT_STRENGTH,&parseError,&status);
1203         (void)coll;   /* Suppress set but not used warning. */
1204         if(u_strcmp(parseError.preContext,preContextExp)!=0){
1205             log_err_status(status, "preContext in UParseError for ucol_openRules does not match: \"%s\"\n",
1206                            aescstrdup(parseError.preContext, -1));
1207         }
1208         if(u_strcmp(parseError.postContext,postContextExp)!=0){
1209             log_err_status(status, "postContext in UParseError for ucol_openRules does not match: \"%s\"\n",
1210                            aescstrdup(parseError.postContext, -1));
1211         }
1212     }
1213 }
1214 
1215 static void
TestJitterbug1098()1216 TestJitterbug1098(){
1217     UChar rule[1000];
1218     UCollator* c1 = NULL;
1219     UErrorCode status = U_ZERO_ERROR;
1220     UParseError parseError;
1221     char preContext[200]={0};
1222     char postContext[200]={0};
1223     int i=0;
1224     const char* rules[] = {
1225          "&''<\\\\",
1226          "&\\'<\\\\",
1227          "&\\\"<'\\'",
1228          "&'\"'<\\'",
1229          NULL
1230 
1231     };
1232     const UCollationResult results1098[] = {
1233         UCOL_LESS,
1234         UCOL_LESS,
1235         UCOL_LESS,
1236         UCOL_LESS,
1237     };
1238     const UChar input[][2]= {
1239         {0x0027,0x005c},
1240         {0x0027,0x005c},
1241         {0x0022,0x005c},
1242         {0x0022,0x0027},
1243     };
1244     UChar X[2] ={0};
1245     UChar Y[2] ={0};
1246     u_memset(parseError.preContext,0x0000,U_PARSE_CONTEXT_LEN);
1247     u_memset(parseError.postContext,0x0000,U_PARSE_CONTEXT_LEN);
1248     for(;rules[i]!=0;i++){
1249         u_uastrcpy(rule, rules[i]);
1250         c1 = ucol_openRules(rule, u_strlen(rule), UCOL_OFF, UCOL_DEFAULT_STRENGTH, &parseError, &status);
1251         if(U_FAILURE(status)){
1252             log_err_status(status, "Could not parse the rules syntax. Error: %s\n", u_errorName(status));
1253 
1254             if (status == U_PARSE_ERROR) {
1255                 u_UCharsToChars(parseError.preContext,preContext,20);
1256                 u_UCharsToChars(parseError.postContext,postContext,20);
1257                 log_verbose("\n\tPre-Context: %s \n\tPost-Context:%s \n",preContext,postContext);
1258             }
1259 
1260             return;
1261         }
1262         X[0] = input[i][0];
1263         Y[0] = input[i][1];
1264         doTest(c1,X,Y,results1098[i]);
1265         ucol_close(c1);
1266     }
1267 }
1268 
1269 static void
TestFCDCrash(void)1270 TestFCDCrash(void) {
1271     static const char *test[] = {
1272     "Gr\\u00F6\\u00DFe",
1273     "Grossist"
1274     };
1275 
1276     UErrorCode status = U_ZERO_ERROR;
1277     UCollator *coll = ucol_open("es", &status);
1278     if(U_FAILURE(status)) {
1279         log_err_status(status, "Couldn't open collator -> %s\n", u_errorName(status));
1280         return;
1281     }
1282     ucol_close(coll);
1283     coll = NULL;
1284     ctest_resetICU();
1285     coll = ucol_open("de_DE", &status);
1286     if(U_FAILURE(status)) {
1287         log_err_status(status, "Couldn't open collator -> %s\n", u_errorName(status));
1288         return;
1289     }
1290     ucol_setAttribute(coll, UCOL_NORMALIZATION_MODE, UCOL_ON, &status);
1291     genericOrderingTest(coll, test, 2);
1292     ucol_close(coll);
1293 }
1294 
1295 /*static UBool
1296 find(UEnumeration* list, const char* str, UErrorCode* status){
1297     const char* value = NULL;
1298     int32_t length=0;
1299     if(U_FAILURE(*status)){
1300         return FALSE;
1301     }
1302     uenum_reset(list, status);
1303     while( (value= uenum_next(list, &length, status))!=NULL){
1304         if(strcmp(value, str)==0){
1305             return TRUE;
1306         }
1307     }
1308     return FALSE;
1309 }*/
1310 
TestJ5298(void)1311 static void TestJ5298(void)
1312 {
1313     UErrorCode status = U_ZERO_ERROR;
1314     char input[256], output[256];
1315     UBool isAvailable;
1316     int32_t i = 0;
1317     UEnumeration* values = NULL;
1318     const char *keywordValue = NULL;
1319     log_verbose("Number of collator locales returned : %i \n", ucol_countAvailable());
1320     values = ucol_getKeywordValues("collation", &status);
1321     while ((keywordValue = uenum_next(values, NULL, &status)) != NULL) {
1322         if (strncmp(keywordValue, "private-", 8) == 0) {
1323             log_err("ucol_getKeywordValues() returns private collation keyword: %s\n", keywordValue);
1324         }
1325     }
1326     for (i = 0; i < ucol_countAvailable(); i++) {
1327         uenum_reset(values, &status);
1328         while ((keywordValue = uenum_next(values, NULL, &status)) != NULL) {
1329             strcpy(input, ucol_getAvailable(i));
1330             if (strcmp(keywordValue, "standard") != 0) {
1331                 strcat(input, "@collation=");
1332                 strcat(input, keywordValue);
1333             }
1334 
1335             ucol_getFunctionalEquivalent(output, 256, "collation", input, &isAvailable, &status);
1336             if (strcmp(input, output) == 0) { /* Unique locale, print it out */
1337                 log_verbose("%s, \n", output);
1338             }
1339         }
1340     }
1341     uenum_close(values);
1342     log_verbose("\n");
1343 }
1344 #endif /* #if !UCONFIG_NO_COLLATION */
1345