]>
Commit | Line | Data |
---|---|---|
1 | // © 2016 and later: Unicode, Inc. and others. | |
2 | // License & terms of use: http://www.unicode.org/copyright.html | |
3 | /* | |
4 | ******************************************************************************* | |
5 | * | |
6 | * Copyright (C) 1999-2014, International Business Machines | |
7 | * Corporation and others. All Rights Reserved. | |
8 | * | |
9 | ******************************************************************************* | |
10 | * file name: collationweights.h | |
11 | * encoding: UTF-8 | |
12 | * tab size: 8 (not used) | |
13 | * indentation:4 | |
14 | * | |
15 | * created on: 2001mar08 as ucol_wgt.h | |
16 | * created by: Markus W. Scherer | |
17 | */ | |
18 | ||
19 | #ifndef __COLLATIONWEIGHTS_H__ | |
20 | #define __COLLATIONWEIGHTS_H__ | |
21 | ||
22 | #include "unicode/utypes.h" | |
23 | ||
24 | #if !UCONFIG_NO_COLLATION | |
25 | ||
26 | #include "unicode/uobject.h" | |
27 | ||
28 | U_NAMESPACE_BEGIN | |
29 | ||
30 | /** | |
31 | * Allocates n collation element weights between two exclusive limits. | |
32 | * Used only internally by the collation tailoring builder. | |
33 | */ | |
34 | class U_I18N_API CollationWeights : public UMemory { | |
35 | public: | |
36 | CollationWeights(); | |
37 | ||
38 | static inline int32_t lengthOfWeight(uint32_t weight) { | |
39 | if((weight&0xffffff)==0) { | |
40 | return 1; | |
41 | } else if((weight&0xffff)==0) { | |
42 | return 2; | |
43 | } else if((weight&0xff)==0) { | |
44 | return 3; | |
45 | } else { | |
46 | return 4; | |
47 | } | |
48 | } | |
49 | ||
50 | void initForPrimary(UBool compressible); | |
51 | void initForSecondary(); | |
52 | void initForTertiary(); | |
53 | ||
54 | /** | |
55 | * Determine heuristically | |
56 | * what ranges to use for a given number of weights between (excluding) | |
57 | * two limits. | |
58 | * | |
59 | * @param lowerLimit A collation element weight; the ranges will be filled to cover | |
60 | * weights greater than this one. | |
61 | * @param upperLimit A collation element weight; the ranges will be filled to cover | |
62 | * weights less than this one. | |
63 | * @param n The number of collation element weights w necessary such that | |
64 | * lowerLimit<w<upperLimit in lexical order. | |
65 | * @return TRUE if it is possible to fit n elements between the limits | |
66 | */ | |
67 | UBool allocWeights(uint32_t lowerLimit, uint32_t upperLimit, int32_t n); | |
68 | ||
69 | /** | |
70 | * Given a set of ranges calculated by allocWeights(), | |
71 | * iterate through the weights. | |
72 | * The ranges are modified to keep the current iteration state. | |
73 | * | |
74 | * @return The next weight in the ranges, or 0xffffffff if there is none left. | |
75 | */ | |
76 | uint32_t nextWeight(); | |
77 | ||
78 | /** @internal */ | |
79 | struct WeightRange { | |
80 | uint32_t start, end; | |
81 | int32_t length, count; | |
82 | }; | |
83 | ||
84 | private: | |
85 | /** @return number of usable byte values for byte idx */ | |
86 | inline int32_t countBytes(int32_t idx) const { | |
87 | return (int32_t)(maxBytes[idx] - minBytes[idx] + 1); | |
88 | } | |
89 | ||
90 | uint32_t incWeight(uint32_t weight, int32_t length) const; | |
91 | uint32_t incWeightByOffset(uint32_t weight, int32_t length, int32_t offset) const; | |
92 | void lengthenRange(WeightRange &range) const; | |
93 | /** | |
94 | * Takes two CE weights and calculates the | |
95 | * possible ranges of weights between the two limits, excluding them. | |
96 | * For weights with up to 4 bytes there are up to 2*4-1=7 ranges. | |
97 | */ | |
98 | UBool getWeightRanges(uint32_t lowerLimit, uint32_t upperLimit); | |
99 | UBool allocWeightsInShortRanges(int32_t n, int32_t minLength); | |
100 | UBool allocWeightsInMinLengthRanges(int32_t n, int32_t minLength); | |
101 | ||
102 | int32_t middleLength; | |
103 | uint32_t minBytes[5]; // for byte 1, 2, 3, 4 | |
104 | uint32_t maxBytes[5]; | |
105 | WeightRange ranges[7]; | |
106 | int32_t rangeIndex; | |
107 | int32_t rangeCount; | |
108 | }; | |
109 | ||
110 | U_NAMESPACE_END | |
111 | ||
112 | #endif // !UCONFIG_NO_COLLATION | |
113 | #endif // __COLLATIONWEIGHTS_H__ |