1 // © 2016 and later: Unicode, Inc. and others.
2 // License & terms of use: http://www.unicode.org/copyright.html
3 /*
4 *******************************************************************************
5 *
6 *   Copyright (C) 1999-2014, International Business Machines
7 *   Corporation and others.  All Rights Reserved.
8 *
9 *******************************************************************************
10 *   file name:  collationweights.h
11 *   encoding:   UTF-8
12 *   tab size:   8 (not used)
13 *   indentation:4
14 *
15 *   created on: 2001mar08 as ucol_wgt.h
16 *   created by: Markus W. Scherer
17 */
18 
19 #ifndef __COLLATIONWEIGHTS_H__
20 #define __COLLATIONWEIGHTS_H__
21 
22 #include "unicode/utypes.h"
23 
24 #if !UCONFIG_NO_COLLATION
25 
26 #include "unicode/uobject.h"
27 
28 U_NAMESPACE_BEGIN
29 
30 /**
31  * Allocates n collation element weights between two exclusive limits.
32  * Used only internally by the collation tailoring builder.
33  */
34 class U_I18N_API CollationWeights : public UMemory {
35 public:
36     CollationWeights();
37 
lengthOfWeight(uint32_t weight)38     static inline int32_t lengthOfWeight(uint32_t weight) {
39         if((weight&0xffffff)==0) {
40             return 1;
41         } else if((weight&0xffff)==0) {
42             return 2;
43         } else if((weight&0xff)==0) {
44             return 3;
45         } else {
46             return 4;
47         }
48     }
49 
50     void initForPrimary(UBool compressible);
51     void initForSecondary();
52     void initForTertiary();
53 
54     /**
55      * Determine heuristically
56      * what ranges to use for a given number of weights between (excluding)
57      * two limits.
58      *
59      * @param lowerLimit A collation element weight; the ranges will be filled to cover
60      *                   weights greater than this one.
61      * @param upperLimit A collation element weight; the ranges will be filled to cover
62      *                   weights less than this one.
63      * @param n          The number of collation element weights w necessary such that
64      *                   lowerLimit<w<upperLimit in lexical order.
65      * @return true if it is possible to fit n elements between the limits
66      */
67     UBool allocWeights(uint32_t lowerLimit, uint32_t upperLimit, int32_t n);
68 
69     /**
70      * Given a set of ranges calculated by allocWeights(),
71      * iterate through the weights.
72      * The ranges are modified to keep the current iteration state.
73      *
74      * @return The next weight in the ranges, or 0xffffffff if there is none left.
75      */
76     uint32_t nextWeight();
77 
78     /** @internal */
79     struct WeightRange {
80         uint32_t start, end;
81         int32_t length, count;
82     };
83 
84 private:
85     /** @return number of usable byte values for byte idx */
countBytes(int32_t idx)86     inline int32_t countBytes(int32_t idx) const {
87         return (int32_t)(maxBytes[idx] - minBytes[idx] + 1);
88     }
89 
90     uint32_t incWeight(uint32_t weight, int32_t length) const;
91     uint32_t incWeightByOffset(uint32_t weight, int32_t length, int32_t offset) const;
92     void lengthenRange(WeightRange &range) const;
93     /**
94      * Takes two CE weights and calculates the
95      * possible ranges of weights between the two limits, excluding them.
96      * For weights with up to 4 bytes there are up to 2*4-1=7 ranges.
97      */
98     UBool getWeightRanges(uint32_t lowerLimit, uint32_t upperLimit);
99     UBool allocWeightsInShortRanges(int32_t n, int32_t minLength);
100     UBool allocWeightsInMinLengthRanges(int32_t n, int32_t minLength);
101 
102     int32_t middleLength;
103     uint32_t minBytes[5];  // for byte 1, 2, 3, 4
104     uint32_t maxBytes[5];
105     WeightRange ranges[7];
106     int32_t rangeIndex;
107     int32_t rangeCount;
108 };
109 
110 U_NAMESPACE_END
111 
112 #endif  // !UCONFIG_NO_COLLATION
113 #endif  // __COLLATIONWEIGHTS_H__
114