]>
Commit | Line | Data |
---|---|---|
9ce05555 | 1 | /* |
e29e285d | 2 | * Copyright (c) 2015 Apple Inc. All rights reserved. |
9ce05555 A |
3 | * |
4 | * @APPLE_LICENSE_HEADER_START@ | |
d7384798 | 5 | * |
9ce05555 A |
6 | * This file contains Original Code and/or Modifications of Original Code |
7 | * as defined in and that are subject to the Apple Public Source License | |
8 | * Version 2.0 (the 'License'). You may not use this file except in | |
9 | * compliance with the License. Please obtain a copy of the License at | |
10 | * http://www.opensource.apple.com/apsl/ and read it before using this | |
11 | * file. | |
d7384798 | 12 | * |
9ce05555 A |
13 | * The Original Code and all software distributed under the License are |
14 | * distributed on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER | |
15 | * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES, | |
16 | * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY, | |
17 | * FITNESS FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT. | |
18 | * Please see the License for the specific language governing rights and | |
19 | * limitations under the License. | |
d7384798 | 20 | * |
9ce05555 A |
21 | * @APPLE_LICENSE_HEADER_END@ |
22 | */ | |
f64f9b69 | 23 | |
9ce05555 | 24 | /* CFCharacterSet.c |
d7384798 | 25 | Copyright (c) 1999-2014, Apple Inc. All rights reserved. |
9ce05555 A |
26 | Responsibility: Aki Inoue |
27 | */ | |
28 | ||
29 | #include <CoreFoundation/CFCharacterSet.h> | |
30 | #include <CoreFoundation/CFByteOrder.h> | |
31 | #include "CFCharacterSetPriv.h" | |
32 | #include <CoreFoundation/CFData.h> | |
33 | #include <CoreFoundation/CFString.h> | |
34 | #include "CFInternal.h" | |
cf7d2af9 | 35 | #include <CoreFoundation/CFUniChar.h> |
9ce05555 A |
36 | #include "CFUniCharPriv.h" |
37 | #include <stdlib.h> | |
38 | #include <string.h> | |
39 | ||
9ce05555 A |
40 | |
41 | #define BITSPERBYTE 8 /* (CHAR_BIT * sizeof(unsigned char)) */ | |
42 | #define LOG_BPB 3 | |
43 | #define LOG_BPLW 5 | |
44 | #define NUMCHARACTERS 65536 | |
45 | ||
46 | #define MAX_ANNEX_PLANE (16) | |
47 | ||
48 | /* Number of things in the array keeping the bits. | |
49 | */ | |
50 | #define __kCFBitmapSize (NUMCHARACTERS / BITSPERBYTE) | |
51 | ||
52 | /* How many elements max can be in an __kCFCharSetClassString CFCharacterSet | |
53 | */ | |
54 | #define __kCFStringCharSetMax 64 | |
55 | ||
56 | /* The last builtin set ID number | |
57 | */ | |
bd5b749c | 58 | #define __kCFLastBuiltinSetID kCFCharacterSetNewline |
9ce05555 A |
59 | |
60 | /* How many elements in the "singles" array before we use binary search. | |
61 | */ | |
62 | #define __kCFSetBreakeven 10 | |
63 | ||
64 | /* This tells us, within 1k or so, whether a thing is POTENTIALLY in the set (in the bitmap blob of the private structure) before we bother to do specific checking. | |
65 | */ | |
/* Tests the coarse "potentially present" bit for character n in the word
   array i: one bit per 1024 characters, 32 bits per array element.
   Both arguments are fully parenthesized so that expressions such as
   (a | b) or (x + 1) can be passed safely. */
#define __CFCSetBitsInRange(n, i) ((i)[(n) >> 15] & (1L << (((n) >> 10) % 32)))
67 | ||
68 | /* Compact bitmap params | |
69 | */ | |
70 | #define __kCFCompactBitmapNumPages (256) | |
71 | ||
72 | #define __kCFCompactBitmapMaxPages (128) // the max pages allocated | |
73 | ||
74 | #define __kCFCompactBitmapPageSize (__kCFBitmapSize / __kCFCompactBitmapNumPages) | |
75 | ||
76 | typedef struct { | |
77 | CFCharacterSetRef *_nonBMPPlanes; | |
78 | unsigned int _validEntriesBitmap; | |
79 | unsigned char _numOfAllocEntries; | |
80 | unsigned char _isAnnexInverted; | |
d8925383 | 81 | uint16_t _padding; |
9ce05555 A |
82 | } CFCharSetAnnexStruct; |
83 | ||
84 | struct __CFCharacterSet { | |
85 | CFRuntimeBase _base; | |
86 | CFHashCode _hashValue; | |
87 | union { | |
88 | struct { | |
89 | CFIndex _type; | |
90 | } _builtin; | |
91 | struct { | |
92 | UInt32 _firstChar; | |
93 | CFIndex _length; | |
94 | } _range; | |
95 | struct { | |
96 | UniChar *_buffer; | |
97 | CFIndex _length; | |
98 | } _string; | |
99 | struct { | |
100 | uint8_t *_bits; | |
101 | } _bitmap; | |
102 | struct { | |
103 | uint8_t *_cBits; | |
104 | } _compactBitmap; | |
105 | } _variants; | |
106 | CFCharSetAnnexStruct *_annex; | |
107 | }; | |
108 | ||
109 | /* _base._info values interesting for CFCharacterSet | |
110 | */ | |
enum {
    /* Class type field */
    __kCFCharSetClassTypeMask = 0x0070,
    __kCFCharSetClassBuiltin = 0x0000,
    __kCFCharSetClassRange = 0x0010,
    __kCFCharSetClassString = 0x0020,
    __kCFCharSetClassBitmap = 0x0030,
    __kCFCharSetClassSet = 0x0040,
    __kCFCharSetClassCompactBitmap = 0x0040,    // same value as __kCFCharSetClassSet

    /* Inversion flag */
    __kCFCharSetIsInvertedMask = 0x0008,
    __kCFCharSetIsInverted = 0x0008,

    /* Set when _hashValue has been stored */
    __kCFCharSetHasHashValueMask = 0x00004,
    __kCFCharSetHasHashValue = 0x0004,

    /* Generic CFBase values */
    __kCFCharSetIsMutableMask = 0x0001,
    __kCFCharSetIsMutable = 0x0001,
};
130 | ||
131 | /* Inline accessor macros for _base._info | |
132 | */ | |
bd5b749c A |
133 | CF_INLINE Boolean __CFCSetIsMutable(CFCharacterSetRef cset) {return (cset->_base._cfinfo[CF_INFO_BITS] & __kCFCharSetIsMutableMask) == __kCFCharSetIsMutable;} |
134 | CF_INLINE Boolean __CFCSetIsBuiltin(CFCharacterSetRef cset) {return (cset->_base._cfinfo[CF_INFO_BITS] & __kCFCharSetClassTypeMask) == __kCFCharSetClassBuiltin;} | |
135 | CF_INLINE Boolean __CFCSetIsRange(CFCharacterSetRef cset) {return (cset->_base._cfinfo[CF_INFO_BITS] & __kCFCharSetClassTypeMask) == __kCFCharSetClassRange;} | |
136 | CF_INLINE Boolean __CFCSetIsString(CFCharacterSetRef cset) {return (cset->_base._cfinfo[CF_INFO_BITS] & __kCFCharSetClassTypeMask) == __kCFCharSetClassString;} | |
137 | CF_INLINE Boolean __CFCSetIsBitmap(CFCharacterSetRef cset) {return (cset->_base._cfinfo[CF_INFO_BITS] & __kCFCharSetClassTypeMask) == __kCFCharSetClassBitmap;} | |
138 | CF_INLINE Boolean __CFCSetIsCompactBitmap(CFCharacterSetRef cset) {return (cset->_base._cfinfo[CF_INFO_BITS] & __kCFCharSetClassTypeMask) == __kCFCharSetClassCompactBitmap;} | |
139 | CF_INLINE Boolean __CFCSetIsInverted(CFCharacterSetRef cset) {return (cset->_base._cfinfo[CF_INFO_BITS] & __kCFCharSetIsInvertedMask) == __kCFCharSetIsInverted;} | |
140 | CF_INLINE Boolean __CFCSetHasHashValue(CFCharacterSetRef cset) {return (cset->_base._cfinfo[CF_INFO_BITS] & __kCFCharSetHasHashValueMask) == __kCFCharSetHasHashValue;} | |
141 | CF_INLINE UInt32 __CFCSetClassType(CFCharacterSetRef cset) {return (cset->_base._cfinfo[CF_INFO_BITS] & __kCFCharSetClassTypeMask);} | |
142 | ||
143 | CF_INLINE void __CFCSetPutIsMutable(CFMutableCharacterSetRef cset, Boolean isMutable) {(isMutable ? (cset->_base._cfinfo[CF_INFO_BITS] |= __kCFCharSetIsMutable) : (cset->_base._cfinfo[CF_INFO_BITS] &= ~ __kCFCharSetIsMutable));} | |
144 | CF_INLINE void __CFCSetPutIsInverted(CFMutableCharacterSetRef cset, Boolean isInverted) {(isInverted ? (cset->_base._cfinfo[CF_INFO_BITS] |= __kCFCharSetIsInverted) : (cset->_base._cfinfo[CF_INFO_BITS] &= ~__kCFCharSetIsInverted));} | |
145 | CF_INLINE void __CFCSetPutHasHashValue(CFMutableCharacterSetRef cset, Boolean hasHash) {(hasHash ? (cset->_base._cfinfo[CF_INFO_BITS] |= __kCFCharSetHasHashValue) : (cset->_base._cfinfo[CF_INFO_BITS] &= ~__kCFCharSetHasHashValue));} | |
146 | CF_INLINE void __CFCSetPutClassType(CFMutableCharacterSetRef cset, UInt32 classType) {cset->_base._cfinfo[CF_INFO_BITS] &= ~__kCFCharSetClassTypeMask; cset->_base._cfinfo[CF_INFO_BITS] |= classType;} | |
9ce05555 | 147 | |
a48904a4 | 148 | CF_PRIVATE Boolean __CFCharacterSetIsMutable(CFCharacterSetRef cset) {return __CFCSetIsMutable(cset);} |
9ce05555 A |
149 | |
150 | /* Inline contents accessor macros | |
151 | */ | |
152 | CF_INLINE CFCharacterSetPredefinedSet __CFCSetBuiltinType(CFCharacterSetRef cset) {return cset->_variants._builtin._type;} | |
153 | CF_INLINE UInt32 __CFCSetRangeFirstChar(CFCharacterSetRef cset) {return cset->_variants._range._firstChar;} | |
154 | CF_INLINE CFIndex __CFCSetRangeLength(CFCharacterSetRef cset) {return cset->_variants._range._length;} | |
155 | CF_INLINE UniChar *__CFCSetStringBuffer(CFCharacterSetRef cset) {return (UniChar*)(cset->_variants._string._buffer);} | |
156 | CF_INLINE CFIndex __CFCSetStringLength(CFCharacterSetRef cset) {return cset->_variants._string._length;} | |
157 | CF_INLINE uint8_t *__CFCSetBitmapBits(CFCharacterSetRef cset) {return cset->_variants._bitmap._bits;} | |
158 | CF_INLINE uint8_t *__CFCSetCompactBitmapBits(CFCharacterSetRef cset) {return cset->_variants._compactBitmap._cBits;} | |
159 | ||
160 | CF_INLINE void __CFCSetPutBuiltinType(CFMutableCharacterSetRef cset, CFCharacterSetPredefinedSet type) {cset->_variants._builtin._type = type;} | |
161 | CF_INLINE void __CFCSetPutRangeFirstChar(CFMutableCharacterSetRef cset, UInt32 first) {cset->_variants._range._firstChar = first;} | |
162 | CF_INLINE void __CFCSetPutRangeLength(CFMutableCharacterSetRef cset, CFIndex length) {cset->_variants._range._length = length;} | |
163 | CF_INLINE void __CFCSetPutStringBuffer(CFMutableCharacterSetRef cset, UniChar *theBuffer) {cset->_variants._string._buffer = theBuffer;} | |
164 | CF_INLINE void __CFCSetPutStringLength(CFMutableCharacterSetRef cset, CFIndex length) {cset->_variants._string._length = length;} | |
165 | CF_INLINE void __CFCSetPutBitmapBits(CFMutableCharacterSetRef cset, uint8_t *bits) {cset->_variants._bitmap._bits = bits;} | |
166 | CF_INLINE void __CFCSetPutCompactBitmapBits(CFMutableCharacterSetRef cset, uint8_t *bits) {cset->_variants._compactBitmap._cBits = bits;} | |
167 | ||
168 | /* Validation funcs | |
169 | */ | |
#if defined(CF_ENABLE_ASSERTIONS)
/* Asserts that type lies in 1 ... __kCFLastBuiltinSetID. */
CF_INLINE void __CFCSetValidateBuiltinType(CFCharacterSetPredefinedSet type, const char *func) {
    // The argument is wider than int on LP64, so it is cast to long and printed with %ld.
    CFAssert2(type > 0 && type <= __kCFLastBuiltinSetID, __kCFLogAssertion, "%s: Unknown builtin type %ld", func, (long)type);
}
/* Asserts that theRange starts at a non-negative location and ends at or below 0x1FFFFF. */
CF_INLINE void __CFCSetValidateRange(CFRange theRange, const char *func) {
    CFAssert3(theRange.location >= 0 && theRange.location + theRange.length <= 0x1FFFFF, __kCFLogAssertion, "%s: Range out of Unicode range (location -> %ld length -> %ld)", func, (long)theRange.location, (long)theRange.length);
}
/* Asserts that cset is a CFCharacterSet instance and is mutable. */
CF_INLINE void __CFCSetValidateTypeAndMutability(CFCharacterSetRef cset, const char *func) {
    __CFGenericValidateType(cset, __kCFCharacterSetTypeID);
    CFAssert1(__CFCSetIsMutable(cset), __kCFLogAssertion, "%s: Immutable character set passed to mutable function", func);
}
#else
/* Assertions disabled: the validators compile away. */
#define __CFCSetValidateBuiltinType(t,f)
#define __CFCSetValidateRange(r,f)
#define __CFCSetValidateTypeAndMutability(r,f)
#endif
186 | ||
187 | /* Inline utility funcs | |
188 | */ | |
189 | static Boolean __CFCSetIsEqualBitmap(const UInt32 *bits1, const UInt32 *bits2) { | |
190 | CFIndex length = __kCFBitmapSize / sizeof(UInt32); | |
191 | ||
192 | if (bits1 == bits2) { | |
193 | return true; | |
194 | } else if (bits1 && bits2) { | |
195 | if (bits1 == (const UInt32 *)-1) { | |
196 | while (length--) if ((UInt32)-1 != *bits2++) return false; | |
197 | } else if (bits2 == (const UInt32 *)-1) { | |
198 | while (length--) if ((UInt32)-1 != *bits1++) return false; | |
199 | } else { | |
200 | while (length--) if (*bits1++ != *bits2++) return false; | |
201 | } | |
202 | return true; | |
203 | } else if (!bits1 && !bits2) { // empty set | |
204 | return true; | |
205 | } else { | |
206 | if (bits2) bits1 = bits2; | |
207 | if (bits1 == (const UInt32 *)-1) return false; | |
208 | while (length--) if (*bits1++) return false; | |
209 | return true; | |
210 | } | |
211 | } | |
212 | ||
213 | CF_INLINE Boolean __CFCSetIsEqualBitmapInverted(const UInt32 *bits1, const UInt32 *bits2) { | |
214 | CFIndex length = __kCFBitmapSize / sizeof(UInt32); | |
215 | ||
216 | while (length--) if (*bits1++ != ~(*(bits2++))) return false; | |
217 | return true; | |
218 | } | |
219 | ||
220 | static Boolean __CFCSetIsBitmapEqualToRange(const UInt32 *bits, UniChar firstChar, UniChar lastChar, Boolean isInverted) { | |
221 | CFIndex firstCharIndex = firstChar >> LOG_BPB; | |
222 | CFIndex lastCharIndex = lastChar >> LOG_BPB; | |
223 | CFIndex length; | |
224 | UInt32 value; | |
225 | ||
226 | if (firstCharIndex == lastCharIndex) { | |
227 | value = ((((UInt32)0xFF) << (firstChar & (BITSPERBYTE - 1))) & (((UInt32)0xFF) >> ((BITSPERBYTE - 1) - (lastChar & (BITSPERBYTE - 1))))) << (((sizeof(UInt32) - 1) - (firstCharIndex % sizeof(UInt32))) * BITSPERBYTE); | |
228 | value = CFSwapInt32HostToBig(value); | |
229 | firstCharIndex = lastCharIndex = firstChar >> LOG_BPLW; | |
230 | if (*(bits + firstCharIndex) != (isInverted ? ~value : value)) return FALSE; | |
231 | } else { | |
232 | UInt32 firstCharMask; | |
233 | UInt32 lastCharMask; | |
234 | ||
235 | length = firstCharIndex % sizeof(UInt32); | |
bd5b749c | 236 | firstCharMask = (((((UInt32)0xFF) << (firstChar & (BITSPERBYTE - 1))) & 0xFF) << (((sizeof(UInt32) - 1) - length) * BITSPERBYTE)) | (((UInt32)0xFFFFFFFF) >> ((length + 1) * BITSPERBYTE)); |
9ce05555 A |
237 | |
238 | length = lastCharIndex % sizeof(UInt32); | |
bd5b749c | 239 | lastCharMask = ((((UInt32)0xFF) >> ((BITSPERBYTE - 1) - (lastChar & (BITSPERBYTE - 1)))) << (((sizeof(UInt32) - 1) - length) * BITSPERBYTE)) | (((UInt32)0xFFFFFFFF) << ((sizeof(UInt32) - length) * BITSPERBYTE)); |
9ce05555 A |
240 | |
241 | firstCharIndex = firstChar >> LOG_BPLW; | |
242 | lastCharIndex = lastChar >> LOG_BPLW; | |
243 | ||
244 | if (firstCharIndex == lastCharIndex) { | |
245 | firstCharMask &= lastCharMask; | |
246 | value = CFSwapInt32HostToBig(firstCharMask & lastCharMask); | |
247 | if (*(bits + firstCharIndex) != (isInverted ? ~value : value)) return FALSE; | |
248 | } else { | |
249 | value = CFSwapInt32HostToBig(firstCharMask); | |
250 | if (*(bits + firstCharIndex) != (isInverted ? ~value : value)) return FALSE; | |
251 | ||
252 | value = CFSwapInt32HostToBig(lastCharMask); | |
253 | if (*(bits + lastCharIndex) != (isInverted ? ~value : value)) return FALSE; | |
254 | } | |
255 | } | |
256 | ||
257 | length = firstCharIndex; | |
bd5b749c | 258 | value = (isInverted ? ((UInt32)0xFFFFFFFF) : 0); |
9ce05555 A |
259 | while (length--) { |
260 | if (*(bits++) != value) return FALSE; | |
261 | } | |
262 | ||
263 | ++bits; // Skip firstCharIndex | |
264 | length = (lastCharIndex - (firstCharIndex + 1)); | |
bd5b749c | 265 | value = (isInverted ? 0 : ((UInt32)0xFFFFFFFF)); |
9ce05555 A |
266 | while (length-- > 0) { |
267 | if (*(bits++) != value) return FALSE; | |
268 | } | |
269 | if (firstCharIndex != lastCharIndex) ++bits; | |
270 | ||
271 | length = (0xFFFF >> LOG_BPLW) - lastCharIndex; | |
bd5b749c | 272 | value = (isInverted ? ((UInt32)0xFFFFFFFF) : 0); |
9ce05555 A |
273 | while (length--) { |
274 | if (*(bits++) != value) return FALSE; | |
275 | } | |
276 | ||
277 | return TRUE; | |
278 | } | |
279 | ||
280 | CF_INLINE Boolean __CFCSetIsBitmapSupersetOfBitmap(const UInt32 *bits1, const UInt32 *bits2, Boolean isInverted1, Boolean isInverted2) { | |
281 | CFIndex length = __kCFBitmapSize / sizeof(UInt32); | |
282 | UInt32 val1, val2; | |
283 | ||
284 | while (length--) { | |
285 | val2 = (isInverted2 ? ~(*(bits2++)) : *(bits2++)); | |
286 | val1 = (isInverted1 ? ~(*(bits1++)) : *(bits1++)) & val2; | |
287 | if (val1 != val2) return false; | |
288 | } | |
289 | ||
290 | return true; | |
291 | } | |
292 | ||
293 | CF_INLINE Boolean __CFCSetHasNonBMPPlane(CFCharacterSetRef cset) { return ((cset)->_annex && (cset)->_annex->_validEntriesBitmap ? true : false); } | |
294 | CF_INLINE Boolean __CFCSetAnnexIsInverted (CFCharacterSetRef cset) { return ((cset)->_annex && (cset)->_annex->_isAnnexInverted ? true : false); } | |
bd5b749c | 295 | CF_INLINE UInt32 __CFCSetAnnexValidEntriesBitmap(CFCharacterSetRef cset) { return ((cset)->_annex ? (cset)->_annex->_validEntriesBitmap : 0); } |
9ce05555 A |
296 | |
297 | CF_INLINE Boolean __CFCSetIsEmpty(CFCharacterSetRef cset) { | |
298 | if (__CFCSetHasNonBMPPlane(cset) || __CFCSetAnnexIsInverted(cset)) return false; | |
299 | ||
300 | switch (__CFCSetClassType(cset)) { | |
301 | case __kCFCharSetClassRange: if (!__CFCSetRangeLength(cset)) return true; break; | |
302 | case __kCFCharSetClassString: if (!__CFCSetStringLength(cset)) return true; break; | |
303 | case __kCFCharSetClassBitmap: if (!__CFCSetBitmapBits(cset)) return true; break; | |
304 | case __kCFCharSetClassCompactBitmap: if (!__CFCSetCompactBitmapBits(cset)) return true; break; | |
305 | } | |
306 | return false; | |
307 | } | |
308 | ||
309 | CF_INLINE void __CFCSetBitmapAddCharacter(uint8_t *bitmap, UniChar theChar) { | |
310 | bitmap[(theChar) >> LOG_BPB] |= (((unsigned)1) << (theChar & (BITSPERBYTE - 1))); | |
311 | } | |
312 | ||
313 | CF_INLINE void __CFCSetBitmapRemoveCharacter(uint8_t *bitmap, UniChar theChar) { | |
314 | bitmap[(theChar) >> LOG_BPB] &= ~(((unsigned)1) << (theChar & (BITSPERBYTE - 1))); | |
315 | } | |
316 | ||
317 | CF_INLINE Boolean __CFCSetIsMemberBitmap(const uint8_t *bitmap, UniChar theChar) { | |
318 | return ((bitmap[(theChar) >> LOG_BPB] & (((unsigned)1) << (theChar & (BITSPERBYTE - 1)))) ? true : false); | |
319 | } | |
320 | ||
321 | #define NUM_32BIT_SLOTS (NUMCHARACTERS / 32) | |
322 | ||
323 | CF_INLINE void __CFCSetBitmapFastFillWithValue(UInt32 *bitmap, uint8_t value) { | |
324 | UInt32 mask = (value << 24) | (value << 16) | (value << 8) | value; | |
325 | UInt32 numSlots = NUMCHARACTERS / 32; | |
326 | ||
327 | while (numSlots--) *(bitmap++) = mask; | |
328 | } | |
329 | ||
330 | CF_INLINE void __CFCSetBitmapAddCharactersInRange(uint8_t *bitmap, UniChar firstChar, UniChar lastChar) { | |
331 | if (firstChar == lastChar) { | |
332 | bitmap[firstChar >> LOG_BPB] |= (((unsigned)1) << (firstChar & (BITSPERBYTE - 1))); | |
333 | } else { | |
334 | UInt32 idx = firstChar >> LOG_BPB; | |
335 | UInt32 max = lastChar >> LOG_BPB; | |
336 | ||
337 | if (idx == max) { | |
338 | bitmap[idx] |= (((unsigned)0xFF) << (firstChar & (BITSPERBYTE - 1))) & (((unsigned)0xFF) >> ((BITSPERBYTE - 1) - (lastChar & (BITSPERBYTE - 1)))); | |
339 | } else { | |
340 | bitmap[idx] |= (((unsigned)0xFF) << (firstChar & (BITSPERBYTE - 1))); | |
341 | bitmap[max] |= (((unsigned)0xFF) >> ((BITSPERBYTE - 1) - (lastChar & (BITSPERBYTE - 1)))); | |
342 | ||
343 | ++idx; | |
344 | while (idx < max) bitmap[idx++] = 0xFF; | |
345 | } | |
346 | } | |
347 | } | |
348 | ||
349 | CF_INLINE void __CFCSetBitmapRemoveCharactersInRange(uint8_t *bitmap, UniChar firstChar, UniChar lastChar) { | |
350 | UInt32 idx = firstChar >> LOG_BPB; | |
351 | UInt32 max = lastChar >> LOG_BPB; | |
352 | ||
353 | if (idx == max) { | |
354 | bitmap[idx] &= ~((((unsigned)0xFF) << (firstChar & (BITSPERBYTE - 1))) & (((unsigned)0xFF) >> ((BITSPERBYTE - 1) - (lastChar & (BITSPERBYTE - 1))))); | |
355 | } else { | |
356 | bitmap[idx] &= ~(((unsigned)0xFF) << (firstChar & (BITSPERBYTE - 1))); | |
357 | bitmap[max] &= ~(((unsigned)0xFF) >> ((BITSPERBYTE - 1) - (lastChar & (BITSPERBYTE - 1)))); | |
358 | ||
359 | ++idx; | |
360 | while (idx < max) bitmap[idx++] = 0; | |
361 | } | |
362 | } | |
363 | ||
364 | #define __CFCSetAnnexBitmapSetPlane(bitmap,plane) ((bitmap) |= (1 << (plane))) | |
365 | #define __CFCSetAnnexBitmapClearPlane(bitmap,plane) ((bitmap) &= (~(1 << (plane)))) | |
366 | #define __CFCSetAnnexBitmapGetPlane(bitmap,plane) ((bitmap) & (1 << (plane))) | |
367 | ||
9ce05555 A |
368 | CF_INLINE void __CFCSetAllocateAnnexForPlane(CFCharacterSetRef cset, int plane) { |
369 | if (cset->_annex == NULL) { | |
370 | ((CFMutableCharacterSetRef)cset)->_annex = (CFCharSetAnnexStruct *)CFAllocatorAllocate(CFGetAllocator(cset), sizeof(CFCharSetAnnexStruct), 0); | |
371 | cset->_annex->_numOfAllocEntries = plane; | |
372 | cset->_annex->_isAnnexInverted = false; | |
373 | cset->_annex->_validEntriesBitmap = 0; | |
bd5b749c | 374 | cset->_annex->_nonBMPPlanes = ((plane > 0) ? (CFCharacterSetRef*)CFAllocatorAllocate(CFGetAllocator(cset), sizeof(CFCharacterSetRef) * plane, 0) : NULL); |
9ce05555 A |
375 | } else if (cset->_annex->_numOfAllocEntries < plane) { |
376 | cset->_annex->_numOfAllocEntries = plane; | |
bd5b749c A |
377 | if (NULL == cset->_annex->_nonBMPPlanes) { |
378 | cset->_annex->_nonBMPPlanes = (CFCharacterSetRef*)CFAllocatorAllocate(CFGetAllocator(cset), sizeof(CFCharacterSetRef) * plane, 0); | |
379 | } else { | |
380 | cset->_annex->_nonBMPPlanes = (CFCharacterSetRef*)CFAllocatorReallocate(CFGetAllocator(cset), (void *)cset->_annex->_nonBMPPlanes, sizeof(CFCharacterSetRef) * plane, 0); | |
381 | } | |
9ce05555 A |
382 | } |
383 | } | |
384 | ||
bd5b749c A |
385 | CF_INLINE void __CFCSetAnnexSetIsInverted(CFCharacterSetRef cset, Boolean flag) { |
386 | if (flag) __CFCSetAllocateAnnexForPlane(cset, 0); | |
387 | if (cset->_annex) ((CFMutableCharacterSetRef)cset)->_annex->_isAnnexInverted = flag; | |
388 | } | |
389 | ||
9ce05555 A |
390 | CF_INLINE void __CFCSetPutCharacterSetToAnnexPlane(CFCharacterSetRef cset, CFCharacterSetRef annexCSet, int plane) { |
391 | __CFCSetAllocateAnnexForPlane(cset, plane); | |
392 | if (__CFCSetAnnexBitmapGetPlane(cset->_annex->_validEntriesBitmap, plane)) CFRelease(cset->_annex->_nonBMPPlanes[plane - 1]); | |
393 | if (annexCSet) { | |
bd5b749c | 394 | cset->_annex->_nonBMPPlanes[plane - 1] = (CFCharacterSetRef)CFRetain(annexCSet); |
9ce05555 A |
395 | __CFCSetAnnexBitmapSetPlane(cset->_annex->_validEntriesBitmap, plane); |
396 | } else { | |
397 | __CFCSetAnnexBitmapClearPlane(cset->_annex->_validEntriesBitmap, plane); | |
398 | } | |
399 | } | |
400 | ||
401 | CF_INLINE CFCharacterSetRef __CFCSetGetAnnexPlaneCharacterSet(CFCharacterSetRef cset, int plane) { | |
402 | __CFCSetAllocateAnnexForPlane(cset, plane); | |
403 | if (!__CFCSetAnnexBitmapGetPlane(cset->_annex->_validEntriesBitmap, plane)) { | |
404 | cset->_annex->_nonBMPPlanes[plane - 1] = (CFCharacterSetRef)CFCharacterSetCreateMutable(CFGetAllocator(cset)); | |
405 | __CFCSetAnnexBitmapSetPlane(cset->_annex->_validEntriesBitmap, plane); | |
406 | } | |
407 | return cset->_annex->_nonBMPPlanes[plane - 1]; | |
408 | } | |
409 | ||
410 | CF_INLINE CFCharacterSetRef __CFCSetGetAnnexPlaneCharacterSetNoAlloc(CFCharacterSetRef cset, int plane) { | |
411 | return (cset->_annex && __CFCSetAnnexBitmapGetPlane(cset->_annex->_validEntriesBitmap, plane) ? cset->_annex->_nonBMPPlanes[plane - 1] : NULL); | |
412 | } | |
413 | ||
414 | CF_INLINE void __CFCSetDeallocateAnnexPlane(CFCharacterSetRef cset) { | |
415 | if (cset->_annex) { | |
416 | int idx; | |
417 | ||
418 | for (idx = 0;idx < MAX_ANNEX_PLANE;idx++) { | |
419 | if (__CFCSetAnnexBitmapGetPlane(cset->_annex->_validEntriesBitmap, idx + 1)) { | |
420 | CFRelease(cset->_annex->_nonBMPPlanes[idx]); | |
421 | } | |
422 | } | |
423 | CFAllocatorDeallocate(CFGetAllocator(cset), cset->_annex->_nonBMPPlanes); | |
424 | CFAllocatorDeallocate(CFGetAllocator(cset), cset->_annex); | |
425 | ((CFMutableCharacterSetRef)cset)->_annex = NULL; | |
426 | } | |
427 | } | |
428 | ||
429 | CF_INLINE uint8_t __CFCSetGetHeaderValue(const uint8_t *bitmap, int *numPages) { | |
430 | uint8_t value = *bitmap; | |
431 | ||
432 | if ((value == 0) || (value == UINT8_MAX)) { | |
433 | int numBytes = __kCFCompactBitmapPageSize - 1; | |
434 | ||
435 | while (numBytes > 0) { | |
436 | if (*(++bitmap) != value) break; | |
437 | --numBytes; | |
438 | } | |
439 | if (numBytes == 0) return value; | |
440 | } | |
441 | return (uint8_t)(++(*numPages)); | |
442 | } | |
443 | ||
444 | CF_INLINE bool __CFCSetIsMemberInCompactBitmap(const uint8_t *compactBitmap, UTF16Char character) { | |
445 | uint8_t value = compactBitmap[(character >> 8)]; // Assuming __kCFCompactBitmapNumPages == 256 | |
446 | ||
447 | if (value == 0) { | |
448 | return false; | |
449 | } else if (value == UINT8_MAX) { | |
450 | return true; | |
451 | } else { | |
452 | compactBitmap += (__kCFCompactBitmapNumPages + (__kCFCompactBitmapPageSize * (value - 1))); | |
453 | character &= 0xFF; // Assuming __kCFCompactBitmapNumPages == 256 | |
454 | return ((compactBitmap[(character / BITSPERBYTE)] & (1 << (character % BITSPERBYTE))) ? true : false); | |
455 | } | |
456 | } | |
457 | ||
458 | CF_INLINE uint32_t __CFCSetGetCompactBitmapSize(const uint8_t *compactBitmap) { | |
459 | uint32_t length = __kCFCompactBitmapNumPages; | |
460 | uint32_t size = __kCFCompactBitmapNumPages; | |
461 | uint8_t value; | |
462 | ||
463 | while (length-- > 0) { | |
464 | value = *(compactBitmap++); | |
465 | if ((value != 0) && (value != UINT8_MAX)) size += __kCFCompactBitmapPageSize; | |
466 | } | |
467 | return size; | |
468 | } | |
469 | ||
9ce05555 A |
470 | CF_INLINE void __CFExpandCompactBitmap(const uint8_t *src, uint8_t *dst) { |
471 | const uint8_t *srcBody = src + __kCFCompactBitmapNumPages; | |
472 | int i; | |
473 | uint8_t value; | |
474 | ||
475 | for (i = 0;i < __kCFCompactBitmapNumPages;i++) { | |
476 | value = *(src++); | |
477 | if ((value == 0) || (value == UINT8_MAX)) { | |
478 | memset(dst, value, __kCFCompactBitmapPageSize); | |
479 | } else { | |
480 | memmove(dst, srcBody, __kCFCompactBitmapPageSize); | |
481 | srcBody += __kCFCompactBitmapPageSize; | |
482 | } | |
483 | dst += __kCFCompactBitmapPageSize; | |
484 | } | |
485 | } | |
486 | ||
487 | ||
488 | static void __CFCheckForExpandedSet(CFCharacterSetRef cset) { | |
489 | static int8_t __CFNumberOfPlanesForLogging = -1; | |
490 | static bool warnedOnce = false; | |
491 | ||
492 | if (0 > __CFNumberOfPlanesForLogging) { | |
cf7d2af9 | 493 | const char *envVar = __CFgetenv("CFCharacterSetCheckForExpandedSet"); |
bd5b749c A |
494 | long value = (envVar ? strtol_l(envVar, NULL, 0, NULL) : 0); |
495 | __CFNumberOfPlanesForLogging = (int8_t)(((value > 0) && (value <= 16)) ? value : 0); | |
9ce05555 A |
496 | } |
497 | ||
498 | if (__CFNumberOfPlanesForLogging) { | |
499 | uint32_t entries = __CFCSetAnnexValidEntriesBitmap(cset); | |
500 | int count = 0; | |
501 | ||
502 | while (entries) { | |
503 | if ((entries & 1) && (++count >= __CFNumberOfPlanesForLogging)) { | |
504 | if (!warnedOnce) { | |
bd5b749c | 505 | CFLog(kCFLogLevelWarning, CFSTR("An expanded CFMutableCharacter has been detected. Recommend to compact with CFCharacterSetCreateCopy")); |
9ce05555 A |
506 | warnedOnce = true; |
507 | } | |
508 | break; | |
509 | } | |
510 | entries >>= 1; | |
511 | } | |
512 | } | |
513 | } | |
514 | ||
515 | static void __CFCSetGetBitmap(CFCharacterSetRef cset, uint8_t *bits) { | |
516 | uint8_t *bitmap; | |
517 | CFIndex length = __kCFBitmapSize; | |
518 | ||
519 | if (__CFCSetIsBitmap(cset) && (bitmap = __CFCSetBitmapBits(cset))) { | |
520 | memmove(bits, bitmap, __kCFBitmapSize); | |
521 | } else { | |
522 | Boolean isInverted = __CFCSetIsInverted(cset); | |
523 | uint8_t value = (isInverted ? (uint8_t)-1 : 0); | |
524 | ||
525 | bitmap = bits; | |
526 | while (length--) *bitmap++ = value; // Initialize the buffer | |
527 | ||
528 | if (!__CFCSetIsEmpty(cset)) { | |
529 | switch (__CFCSetClassType(cset)) { | |
530 | case __kCFCharSetClassBuiltin: { | |
bd5b749c | 531 | UInt8 result = CFUniCharGetBitmapForPlane(__CFCSetBuiltinType(cset), 0, bits, (isInverted != 0)); |
9ce05555 A |
532 | if (result == kCFUniCharBitmapEmpty && isInverted) { |
533 | length = __kCFBitmapSize; | |
534 | bitmap = bits; | |
535 | while (length--) *bitmap++ = 0; | |
536 | } else if (result == kCFUniCharBitmapAll && !isInverted) { | |
537 | length = __kCFBitmapSize; | |
538 | bitmap = bits; | |
539 | while (length--) *bitmap++ = (UInt8)0xFF; | |
540 | } | |
541 | } | |
542 | break; | |
543 | ||
544 | case __kCFCharSetClassRange: { | |
545 | UInt32 theChar = __CFCSetRangeFirstChar(cset); | |
546 | if (theChar < NUMCHARACTERS) { // the range starts in BMP | |
547 | length = __CFCSetRangeLength(cset); | |
548 | if (theChar + length >= NUMCHARACTERS) length = NUMCHARACTERS - theChar; | |
549 | if (isInverted) { | |
bd5b749c | 550 | __CFCSetBitmapRemoveCharactersInRange(bits, theChar, (UniChar)(theChar + length) - 1); |
9ce05555 | 551 | } else { |
bd5b749c | 552 | __CFCSetBitmapAddCharactersInRange(bits, theChar, (UniChar)(theChar + length) - 1); |
9ce05555 A |
553 | } |
554 | } | |
555 | } | |
556 | break; | |
557 | ||
558 | case __kCFCharSetClassString: { | |
559 | const UniChar *buffer = __CFCSetStringBuffer(cset); | |
560 | length = __CFCSetStringLength(cset); | |
561 | while (length--) (isInverted ? __CFCSetBitmapRemoveCharacter(bits, *buffer++) : __CFCSetBitmapAddCharacter(bits, *buffer++)); | |
562 | } | |
563 | break; | |
564 | ||
565 | case __kCFCharSetClassCompactBitmap: | |
566 | __CFExpandCompactBitmap(__CFCSetCompactBitmapBits(cset), bits); | |
567 | break; | |
568 | } | |
569 | } | |
570 | } | |
571 | } | |
572 | ||
573 | static Boolean __CFCharacterSetEqual(CFTypeRef cf1, CFTypeRef cf2); | |
574 | ||
575 | static Boolean __CFCSetIsEqualAnnex(CFCharacterSetRef cf1, CFCharacterSetRef cf2) { | |
576 | CFCharacterSetRef subSet1; | |
577 | CFCharacterSetRef subSet2; | |
578 | Boolean isAnnexInvertStateIdentical = (__CFCSetAnnexIsInverted(cf1) == __CFCSetAnnexIsInverted(cf2) ? true: false); | |
579 | int idx; | |
580 | ||
581 | if (isAnnexInvertStateIdentical) { | |
582 | if (__CFCSetAnnexValidEntriesBitmap(cf1) != __CFCSetAnnexValidEntriesBitmap(cf2)) return false; | |
583 | for (idx = 1;idx <= MAX_ANNEX_PLANE;idx++) { | |
584 | subSet1 = __CFCSetGetAnnexPlaneCharacterSetNoAlloc(cf1, idx); | |
585 | subSet2 = __CFCSetGetAnnexPlaneCharacterSetNoAlloc(cf2, idx); | |
586 | ||
587 | if (subSet1 && !__CFCharacterSetEqual(subSet1, subSet2)) return false; | |
588 | } | |
589 | } else { | |
590 | uint8_t bitsBuf[__kCFBitmapSize]; | |
9ce05555 | 591 | uint8_t bitsBuf2[__kCFBitmapSize]; |
9ce05555 A |
592 | |
593 | for (idx = 1;idx <= MAX_ANNEX_PLANE;idx++) { | |
594 | subSet1 = __CFCSetGetAnnexPlaneCharacterSetNoAlloc(cf1, idx); | |
595 | subSet2 = __CFCSetGetAnnexPlaneCharacterSetNoAlloc(cf2, idx); | |
596 | ||
597 | if (subSet1 == NULL && subSet2 == NULL) { | |
9ce05555 A |
598 | return false; |
599 | } else if (subSet1 == NULL) { | |
600 | if (__CFCSetIsBitmap(subSet2)) { | |
601 | if (!__CFCSetIsEqualBitmap((const UInt32 *)__CFCSetBitmapBits(subSet2), (const UInt32 *)-1)) { | |
9ce05555 A |
602 | return false; |
603 | } | |
604 | } else { | |
605 | __CFCSetGetBitmap(subSet2, bitsBuf); | |
606 | if (!__CFCSetIsEqualBitmap((const UInt32 *)bitsBuf, (const UInt32 *)-1)) { | |
9ce05555 A |
607 | return false; |
608 | } | |
609 | } | |
610 | } else if (subSet2 == NULL) { | |
611 | if (__CFCSetIsBitmap(subSet1)) { | |
612 | if (!__CFCSetIsEqualBitmap((const UInt32 *)__CFCSetBitmapBits(subSet1), (const UInt32 *)-1)) { | |
9ce05555 A |
613 | return false; |
614 | } | |
615 | } else { | |
616 | __CFCSetGetBitmap(subSet1, bitsBuf); | |
617 | if (!__CFCSetIsEqualBitmap((const UInt32 *)bitsBuf, (const UInt32 *)-1)) { | |
9ce05555 A |
618 | return false; |
619 | } | |
620 | } | |
621 | } else { | |
622 | Boolean isBitmap1 = __CFCSetIsBitmap(subSet1); | |
623 | Boolean isBitmap2 = __CFCSetIsBitmap(subSet2); | |
624 | ||
625 | if (isBitmap1 && isBitmap2) { | |
626 | if (!__CFCSetIsEqualBitmapInverted((const UInt32 *)__CFCSetBitmapBits(subSet1), (const UInt32 *)__CFCSetBitmapBits(subSet2))) { | |
9ce05555 A |
627 | return false; |
628 | } | |
629 | } else if (!isBitmap1 && !isBitmap2) { | |
630 | __CFCSetGetBitmap(subSet1, bitsBuf); | |
9ce05555 A |
631 | __CFCSetGetBitmap(subSet2, bitsBuf2); |
632 | if (!__CFCSetIsEqualBitmapInverted((const UInt32 *)bitsBuf, (const UInt32 *)bitsBuf2)) { | |
9ce05555 A |
633 | return false; |
634 | } | |
635 | } else { | |
636 | if (isBitmap2) { | |
637 | CFCharacterSetRef tmp = subSet2; | |
638 | subSet2 = subSet1; | |
639 | subSet1 = tmp; | |
640 | } | |
641 | __CFCSetGetBitmap(subSet2, bitsBuf); | |
642 | if (!__CFCSetIsEqualBitmapInverted((const UInt32 *)__CFCSetBitmapBits(subSet1), (const UInt32 *)bitsBuf)) { | |
9ce05555 A |
643 | return false; |
644 | } | |
645 | } | |
646 | } | |
647 | } | |
648 | } | |
649 | return true; | |
650 | } | |
651 | ||
652 | /* Compact bitmap | |
653 | */ | |
654 | static uint8_t *__CFCreateCompactBitmap(CFAllocatorRef allocator, const uint8_t *bitmap) { | |
655 | const uint8_t *src; | |
656 | uint8_t *dst; | |
657 | int i; | |
658 | int numPages = 0; | |
659 | uint8_t header[__kCFCompactBitmapNumPages]; | |
660 | ||
661 | src = bitmap; | |
662 | for (i = 0;i < __kCFCompactBitmapNumPages;i++) { | |
663 | header[i] = __CFCSetGetHeaderValue(src, &numPages); | |
664 | ||
665 | // Allocating more pages is probably not interesting enough to be compact | |
666 | if (numPages > __kCFCompactBitmapMaxPages) return NULL; | |
667 | src += __kCFCompactBitmapPageSize; | |
668 | } | |
669 | ||
bd5b749c | 670 | dst = (uint8_t *)CFAllocatorAllocate(allocator, __kCFCompactBitmapNumPages + (__kCFCompactBitmapPageSize * numPages), 0); |
9ce05555 A |
671 | |
672 | if (numPages > 0) { | |
673 | uint8_t *dstBody = dst + __kCFCompactBitmapNumPages; | |
674 | ||
675 | src = bitmap; | |
676 | for (i = 0;i < __kCFCompactBitmapNumPages;i++) { | |
677 | dst[i] = header[i]; | |
678 | ||
679 | if ((dst[i] != 0) && (dst[i] != UINT8_MAX)) { | |
680 | memmove(dstBody, src, __kCFCompactBitmapPageSize); | |
681 | dstBody += __kCFCompactBitmapPageSize; | |
682 | } | |
683 | src += __kCFCompactBitmapPageSize; | |
684 | } | |
685 | } else { | |
686 | memmove(dst, header, __kCFCompactBitmapNumPages); | |
687 | } | |
688 | ||
689 | return dst; | |
690 | } | |
691 | ||
692 | static void __CFCSetMakeCompact(CFMutableCharacterSetRef cset) { | |
693 | if (__CFCSetIsBitmap(cset) && __CFCSetBitmapBits(cset)) { | |
694 | uint8_t *bitmap = __CFCSetBitmapBits(cset); | |
695 | uint8_t *cBitmap = __CFCreateCompactBitmap(CFGetAllocator(cset), bitmap); | |
696 | ||
697 | if (cBitmap) { | |
698 | CFAllocatorDeallocate(CFGetAllocator(cset), bitmap); | |
699 | __CFCSetPutClassType(cset, __kCFCharSetClassCompactBitmap); | |
700 | __CFCSetPutCompactBitmapBits(cset, cBitmap); | |
701 | } | |
702 | } | |
703 | } | |
704 | ||
705 | static void __CFCSetAddNonBMPPlanesInRange(CFMutableCharacterSetRef cset, CFRange range) { | |
706 | int firstChar = (range.location & 0xFFFF); | |
707 | int maxChar = range.location + range.length; | |
708 | int idx = range.location >> 16; // first plane | |
709 | int maxPlane = (maxChar - 1) >> 16; // last plane | |
710 | CFRange planeRange; | |
711 | CFMutableCharacterSetRef annexPlane; | |
712 | ||
713 | maxChar &= 0xFFFF; | |
714 | ||
715 | for (idx = (idx ? idx : 1);idx <= maxPlane;idx++) { | |
716 | planeRange.location = __CFMax(firstChar, 0); | |
717 | planeRange.length = (idx == maxPlane && maxChar ? maxChar : 0x10000) - planeRange.location; | |
718 | if (__CFCSetAnnexIsInverted(cset)) { | |
719 | if ((annexPlane = (CFMutableCharacterSetRef)__CFCSetGetAnnexPlaneCharacterSetNoAlloc(cset, idx))) { | |
720 | CFCharacterSetRemoveCharactersInRange(annexPlane, planeRange); | |
721 | if (__CFCSetIsEmpty(annexPlane) && !__CFCSetIsInverted(annexPlane)) { | |
722 | CFRelease(annexPlane); | |
723 | __CFCSetAnnexBitmapClearPlane(cset->_annex->_validEntriesBitmap, idx); | |
724 | } | |
725 | } | |
726 | } else { | |
727 | CFCharacterSetAddCharactersInRange((CFMutableCharacterSetRef)__CFCSetGetAnnexPlaneCharacterSet(cset, idx), planeRange); | |
728 | } | |
729 | } | |
730 | if (!__CFCSetHasNonBMPPlane(cset) && !__CFCSetAnnexIsInverted(cset)) __CFCSetDeallocateAnnexPlane(cset); | |
731 | } | |
732 | ||
733 | static void __CFCSetRemoveNonBMPPlanesInRange(CFMutableCharacterSetRef cset, CFRange range) { | |
734 | int firstChar = (range.location & 0xFFFF); | |
735 | int maxChar = range.location + range.length; | |
736 | int idx = range.location >> 16; // first plane | |
737 | int maxPlane = (maxChar - 1) >> 16; // last plane | |
738 | CFRange planeRange; | |
739 | CFMutableCharacterSetRef annexPlane; | |
740 | ||
741 | maxChar &= 0xFFFF; | |
742 | ||
743 | for (idx = (idx ? idx : 1);idx <= maxPlane;idx++) { | |
744 | planeRange.location = __CFMax(firstChar, 0); | |
745 | planeRange.length = (idx == maxPlane && maxChar ? maxChar : 0x10000) - planeRange.location; | |
746 | if (__CFCSetAnnexIsInverted(cset)) { | |
747 | CFCharacterSetAddCharactersInRange((CFMutableCharacterSetRef)__CFCSetGetAnnexPlaneCharacterSet(cset, idx), planeRange); | |
748 | } else { | |
749 | if ((annexPlane = (CFMutableCharacterSetRef)__CFCSetGetAnnexPlaneCharacterSetNoAlloc(cset, idx))) { | |
750 | CFCharacterSetRemoveCharactersInRange(annexPlane, planeRange); | |
751 | if(__CFCSetIsEmpty(annexPlane) && !__CFCSetIsInverted(annexPlane)) { | |
752 | CFRelease(annexPlane); | |
753 | __CFCSetAnnexBitmapClearPlane(cset->_annex->_validEntriesBitmap, idx); | |
754 | } | |
755 | } | |
756 | } | |
757 | } | |
758 | if (!__CFCSetHasNonBMPPlane(cset) && !__CFCSetAnnexIsInverted(cset)) __CFCSetDeallocateAnnexPlane(cset); | |
759 | } | |
760 | ||
761 | static void __CFCSetMakeBitmap(CFMutableCharacterSetRef cset) { | |
762 | if (!__CFCSetIsBitmap(cset) || !__CFCSetBitmapBits(cset)) { | |
d8925383 | 763 | CFAllocatorRef allocator = CFGetAllocator(cset); |
bd5b749c | 764 | uint8_t *bitmap = (uint8_t *)CFAllocatorAllocate(allocator, __kCFBitmapSize, 0); |
9ce05555 A |
765 | __CFCSetGetBitmap(cset, bitmap); |
766 | ||
767 | if (__CFCSetIsBuiltin(cset)) { | |
768 | CFIndex numPlanes = CFUniCharGetNumberOfPlanes(__CFCSetBuiltinType(cset)); | |
769 | ||
770 | if (numPlanes > 1) { | |
771 | CFMutableCharacterSetRef annexSet; | |
772 | uint8_t *annexBitmap = NULL; | |
773 | int idx; | |
774 | UInt8 result; | |
775 | ||
776 | __CFCSetAllocateAnnexForPlane(cset, numPlanes - 1); | |
777 | for (idx = 1;idx < numPlanes;idx++) { | |
d8925383 | 778 | if (NULL == annexBitmap) { |
bd5b749c | 779 | annexBitmap = (uint8_t *)CFAllocatorAllocate(allocator, __kCFBitmapSize, 0); |
d8925383 | 780 | } |
9ce05555 A |
781 | result = CFUniCharGetBitmapForPlane(__CFCSetBuiltinType(cset), idx, annexBitmap, false); |
782 | if (result == kCFUniCharBitmapEmpty) continue; | |
783 | if (result == kCFUniCharBitmapAll) { | |
784 | CFIndex bitmapLength = __kCFBitmapSize; | |
785 | uint8_t *bytes = annexBitmap; | |
786 | while (bitmapLength-- > 0) *(bytes++) = (uint8_t)0xFF; | |
787 | } | |
788 | annexSet = (CFMutableCharacterSetRef)__CFCSetGetAnnexPlaneCharacterSet(cset, idx); | |
789 | __CFCSetPutClassType(annexSet, __kCFCharSetClassBitmap); | |
790 | __CFCSetPutBitmapBits(annexSet, annexBitmap); | |
791 | __CFCSetPutIsInverted(annexSet, false); | |
792 | __CFCSetPutHasHashValue(annexSet, false); | |
793 | annexBitmap = NULL; | |
794 | } | |
d8925383 | 795 | if (annexBitmap) CFAllocatorDeallocate(allocator, annexBitmap); |
9ce05555 A |
796 | } |
797 | } else if (__CFCSetIsCompactBitmap(cset) && __CFCSetCompactBitmapBits(cset)) { | |
d8925383 | 798 | CFAllocatorDeallocate(allocator, __CFCSetCompactBitmapBits(cset)); |
9ce05555 A |
799 | __CFCSetPutCompactBitmapBits(cset, NULL); |
800 | } else if (__CFCSetIsString(cset) && __CFCSetStringBuffer(cset)) { | |
d8925383 | 801 | CFAllocatorDeallocate(allocator, __CFCSetStringBuffer(cset)); |
9ce05555 A |
802 | __CFCSetPutStringBuffer(cset, NULL); |
803 | } else if (__CFCSetIsRange(cset)) { // We may have to allocate annex here | |
804 | Boolean needsToInvert = (!__CFCSetHasNonBMPPlane(cset) && __CFCSetIsInverted(cset) ? true : false); | |
805 | __CFCSetAddNonBMPPlanesInRange(cset, CFRangeMake(__CFCSetRangeFirstChar(cset), __CFCSetRangeLength(cset))); | |
806 | if (needsToInvert) __CFCSetAnnexSetIsInverted(cset, true); | |
807 | } | |
808 | __CFCSetPutClassType(cset, __kCFCharSetClassBitmap); | |
809 | __CFCSetPutBitmapBits(cset, bitmap); | |
810 | __CFCSetPutIsInverted(cset, false); | |
811 | } | |
812 | } | |
813 | ||
814 | CF_INLINE CFMutableCharacterSetRef __CFCSetGenericCreate(CFAllocatorRef allocator, UInt32 flags) { | |
815 | CFMutableCharacterSetRef cset; | |
816 | CFIndex size = sizeof(struct __CFCharacterSet) - sizeof(CFRuntimeBase); | |
817 | ||
818 | cset = (CFMutableCharacterSetRef)_CFRuntimeCreateInstance(allocator, CFCharacterSetGetTypeID(), size, NULL); | |
819 | if (NULL == cset) return NULL; | |
820 | ||
bd5b749c | 821 | cset->_base._cfinfo[CF_INFO_BITS] |= flags; |
9ce05555 A |
822 | cset->_hashValue = 0; |
823 | cset->_annex = NULL; | |
824 | ||
825 | return cset; | |
826 | } | |
827 | ||
cf7d2af9 A |
828 | static void __CFApplySurrogatesInString(CFMutableCharacterSetRef cset, CFStringRef string, void (*applyer)(CFMutableCharacterSetRef, CFRange)) { |
829 | CFStringInlineBuffer buffer; | |
830 | CFIndex index, length = CFStringGetLength(string); | |
831 | CFRange range = CFRangeMake(0, 0); | |
832 | UTF32Char character; | |
833 | ||
834 | CFStringInitInlineBuffer(string, &buffer, CFRangeMake(0, length)); | |
835 | ||
836 | for (index = 0;index < length;index++) { | |
837 | character = __CFStringGetCharacterFromInlineBufferQuick(&buffer, index); | |
838 | ||
839 | if (CFStringIsSurrogateHighCharacter(character) && ((index + 1) < length)) { | |
840 | UTF16Char other = __CFStringGetCharacterFromInlineBufferQuick(&buffer, index + 1); | |
841 | ||
842 | if (CFStringIsSurrogateLowCharacter(other)) { | |
843 | character = CFStringGetLongCharacterForSurrogatePair(character, other); | |
844 | ||
845 | if ((range.length + range.location) == character) { | |
846 | ++range.length; | |
847 | } else { | |
848 | if (range.length > 0) applyer(cset, range); | |
849 | range.location = character; | |
850 | range.length = 1; | |
851 | } | |
852 | } | |
853 | ||
854 | ++index; // skip the low surrogate | |
855 | } | |
856 | } | |
857 | ||
858 | if (range.length > 0) applyer(cset, range); | |
859 | } | |
860 | ||
861 | ||
9ce05555 A |
862 | /* Bsearch theChar for __kCFCharSetClassString |
863 | */ | |
864 | CF_INLINE Boolean __CFCSetBsearchUniChar(const UniChar *theTable, CFIndex length, UniChar theChar) { | |
865 | const UniChar *p, *q, *divider; | |
866 | ||
867 | if ((theChar < theTable[0]) || (theChar > theTable[length - 1])) return false; | |
868 | ||
869 | p = theTable; | |
870 | q = p + (length - 1); | |
871 | while (p <= q) { | |
872 | divider = p + ((q - p) >> 1); /* divide by 2 */ | |
873 | if (theChar < *divider) q = divider - 1; | |
874 | else if (theChar > *divider) p = divider + 1; | |
875 | else return true; | |
876 | } | |
877 | return false; | |
878 | } | |
879 | ||
9ce05555 A |
880 | /* Array of instantiated builtin set. Note builtin set ID starts with 1 so the array index is ID - 1 |
881 | */ | |
882 | static CFCharacterSetRef *__CFBuiltinSets = NULL; | |
883 | ||
884 | /* Global lock for character set | |
885 | */ | |
d7384798 | 886 | static OSSpinLock __CFCharacterSetLock = OS_SPINLOCK_INIT; |
9ce05555 A |
887 | |
888 | /* CFBase API functions | |
889 | */ | |
890 | static Boolean __CFCharacterSetEqual(CFTypeRef cf1, CFTypeRef cf2) { | |
bd5b749c A |
891 | Boolean isInvertStateIdentical = (__CFCSetIsInverted((CFCharacterSetRef)cf1) == __CFCSetIsInverted((CFCharacterSetRef)cf2) ? true: false); |
892 | Boolean isAnnexInvertStateIdentical = (__CFCSetAnnexIsInverted((CFCharacterSetRef)cf1) == __CFCSetAnnexIsInverted((CFCharacterSetRef)cf2) ? true: false); | |
9ce05555 A |
893 | CFIndex idx; |
894 | CFCharacterSetRef subSet1; | |
895 | uint8_t bitsBuf[__kCFBitmapSize]; | |
896 | uint8_t *bits; | |
897 | Boolean isBitmap1; | |
898 | Boolean isBitmap2; | |
899 | ||
bd5b749c A |
900 | if (__CFCSetHasHashValue((CFCharacterSetRef)cf1) && __CFCSetHasHashValue((CFCharacterSetRef)cf2) && ((CFCharacterSetRef)cf1)->_hashValue != ((CFCharacterSetRef)cf2)->_hashValue) return false; |
901 | if (__CFCSetIsEmpty((CFCharacterSetRef)cf1) && __CFCSetIsEmpty((CFCharacterSetRef)cf2) && !isInvertStateIdentical) return false; | |
9ce05555 | 902 | |
a48904a4 | 903 | if ((__CFCSetClassType((CFCharacterSetRef)cf1) == __CFCSetClassType((CFCharacterSetRef)cf2)) && !__CFCSetIsCompactBitmap((CFCharacterSetRef)cf1)) { // Types are identical, we can do it fast |
bd5b749c | 904 | switch (__CFCSetClassType((CFCharacterSetRef)cf1)) { |
9ce05555 | 905 | case __kCFCharSetClassBuiltin: |
bd5b749c | 906 | return (__CFCSetBuiltinType((CFCharacterSetRef)cf1) == __CFCSetBuiltinType((CFCharacterSetRef)cf2) && isInvertStateIdentical ? true : false); |
9ce05555 A |
907 | |
908 | case __kCFCharSetClassRange: | |
bd5b749c | 909 | return (__CFCSetRangeFirstChar((CFCharacterSetRef)cf1) == __CFCSetRangeFirstChar((CFCharacterSetRef)cf2) && __CFCSetRangeLength((CFCharacterSetRef)cf1) && __CFCSetRangeLength((CFCharacterSetRef)cf2) && isInvertStateIdentical ? true : false); |
9ce05555 A |
910 | |
911 | case __kCFCharSetClassString: | |
a48904a4 | 912 | if (isInvertStateIdentical) { |
bd5b749c | 913 | const UniChar *buf1 = __CFCSetStringBuffer((CFCharacterSetRef)cf1); |
a48904a4 | 914 | const UniChar *buf1End = buf1 + __CFCSetStringLength((CFCharacterSetRef)cf1); |
bd5b749c | 915 | const UniChar *buf2 = __CFCSetStringBuffer((CFCharacterSetRef)cf2); |
a48904a4 | 916 | const UniChar *buf2End = buf2 + __CFCSetStringLength((CFCharacterSetRef)cf2); |
9ce05555 | 917 | |
a48904a4 A |
918 | while ((buf1 < buf1End) && (buf2 < buf2End)) { |
919 | UniChar char1 = *buf1; | |
920 | UniChar char2 = *buf2; | |
921 | ||
922 | if (char1 != char2) return false; | |
923 | ||
924 | do { ++buf1; } while ((buf1 < buf1End) && (char1 == *buf1)); | |
925 | do { ++buf2; } while ((buf2 < buf2End) && (char2 == *buf2)); | |
926 | } | |
9ce05555 A |
927 | } else { |
928 | return false; | |
929 | } | |
930 | break; | |
931 | ||
932 | case __kCFCharSetClassBitmap: | |
bd5b749c | 933 | if (!__CFCSetIsEqualBitmap((const UInt32 *)__CFCSetBitmapBits((CFCharacterSetRef)cf1), (const UInt32 *)__CFCSetBitmapBits((CFCharacterSetRef)cf2))) return false; |
9ce05555 A |
934 | break; |
935 | } | |
bd5b749c | 936 | return __CFCSetIsEqualAnnex((CFCharacterSetRef)cf1, (CFCharacterSetRef)cf2); |
9ce05555 A |
937 | } |
938 | ||
939 | // Check for easy empty cases | |
bd5b749c A |
940 | if (__CFCSetIsEmpty((CFCharacterSetRef)cf1) || __CFCSetIsEmpty((CFCharacterSetRef)cf2)) { |
941 | CFCharacterSetRef emptySet = (__CFCSetIsEmpty((CFCharacterSetRef)cf1) ? (CFCharacterSetRef)cf1 : (CFCharacterSetRef)cf2); | |
942 | CFCharacterSetRef nonEmptySet = (emptySet == cf1 ? (CFCharacterSetRef)cf2 : (CFCharacterSetRef)cf1); | |
9ce05555 A |
943 | |
944 | if (__CFCSetIsBuiltin(nonEmptySet)) { | |
945 | return false; | |
946 | } else if (__CFCSetIsRange(nonEmptySet)) { | |
947 | if (isInvertStateIdentical) { | |
948 | return (__CFCSetRangeLength(nonEmptySet) ? false : true); | |
949 | } else { | |
950 | return (__CFCSetRangeLength(nonEmptySet) == 0x110000 ? true : false); | |
951 | } | |
952 | } else { | |
953 | if (__CFCSetAnnexIsInverted(nonEmptySet)) { | |
954 | if (__CFCSetAnnexValidEntriesBitmap(nonEmptySet) != 0x1FFFE) return false; | |
955 | } else { | |
956 | if (__CFCSetAnnexValidEntriesBitmap(nonEmptySet)) return false; | |
957 | } | |
958 | ||
959 | if (__CFCSetIsBitmap(nonEmptySet)) { | |
960 | bits = __CFCSetBitmapBits(nonEmptySet); | |
961 | } else { | |
962 | bits = bitsBuf; | |
963 | __CFCSetGetBitmap(nonEmptySet, bitsBuf); | |
964 | } | |
965 | ||
966 | if (__CFCSetIsEqualBitmap(NULL, (const UInt32 *)bits)) { | |
967 | if (!__CFCSetAnnexIsInverted(nonEmptySet)) return true; | |
968 | } else { | |
969 | return false; | |
970 | } | |
971 | ||
972 | // Annex set has to be CFRangeMake(0x10000, 0xfffff) | |
973 | for (idx = 1;idx < MAX_ANNEX_PLANE;idx++) { | |
974 | if (__CFCSetIsBitmap(nonEmptySet)) { | |
975 | if (!__CFCSetIsEqualBitmap((__CFCSetAnnexIsInverted(nonEmptySet) ? NULL : (const UInt32 *)-1), (const UInt32 *)bitsBuf)) return false; | |
976 | } else { | |
977 | __CFCSetGetBitmap(__CFCSetGetAnnexPlaneCharacterSetNoAlloc(nonEmptySet, idx), bitsBuf); | |
978 | if (!__CFCSetIsEqualBitmap((const UInt32 *)-1, (const UInt32 *)bitsBuf)) return false; | |
979 | } | |
980 | } | |
981 | return true; | |
982 | } | |
983 | } | |
984 | ||
bd5b749c A |
985 | if (__CFCSetIsBuiltin((CFCharacterSetRef)cf1) || __CFCSetIsBuiltin((CFCharacterSetRef)cf2)) { |
986 | CFCharacterSetRef builtinSet = (__CFCSetIsBuiltin((CFCharacterSetRef)cf1) ? (CFCharacterSetRef)cf1 : (CFCharacterSetRef)cf2); | |
987 | CFCharacterSetRef nonBuiltinSet = (builtinSet == cf1 ? (CFCharacterSetRef)cf2 : (CFCharacterSetRef)cf1); | |
9ce05555 A |
988 | |
989 | ||
990 | if (__CFCSetIsRange(nonBuiltinSet)) { | |
991 | UTF32Char firstChar = __CFCSetRangeFirstChar(nonBuiltinSet); | |
992 | UTF32Char lastChar = (firstChar + __CFCSetRangeLength(nonBuiltinSet) - 1); | |
993 | uint8_t firstPlane = (firstChar >> 16) & 0xFF; | |
994 | uint8_t lastPlane = (lastChar >> 16) & 0xFF; | |
995 | uint8_t result; | |
996 | ||
997 | for (idx = 0;idx < MAX_ANNEX_PLANE;idx++) { | |
bd5b749c | 998 | result = CFUniCharGetBitmapForPlane(__CFCSetBuiltinType(builtinSet), idx, bitsBuf, (isInvertStateIdentical != 0)); |
9ce05555 A |
999 | |
1000 | if (idx < firstPlane || idx > lastPlane) { | |
1001 | if (result == kCFUniCharBitmapAll) { | |
1002 | return false; | |
1003 | } else if (result == kCFUniCharBitmapFilled) { | |
1004 | if (!__CFCSetIsEqualBitmap(NULL, (const UInt32 *)bitsBuf)) return false; | |
1005 | } | |
1006 | } else if (idx > firstPlane && idx < lastPlane) { | |
1007 | if (result == kCFUniCharBitmapEmpty) { | |
1008 | return false; | |
1009 | } else if (result == kCFUniCharBitmapFilled) { | |
1010 | if (!__CFCSetIsEqualBitmap((const UInt32 *)-1, (const UInt32 *)bitsBuf)) return false; | |
1011 | } | |
1012 | } else { | |
1013 | if (result == kCFUniCharBitmapEmpty) { | |
1014 | return false; | |
1015 | } else if (result == kCFUniCharBitmapAll) { | |
1016 | if (idx == firstPlane) { | |
1017 | if (((firstChar & 0xFFFF) != 0) || (firstPlane == lastPlane && ((lastChar & 0xFFFF) != 0xFFFF))) return false; | |
1018 | } else { | |
1019 | if (((lastChar & 0xFFFF) != 0xFFFF) || (firstPlane == lastPlane && ((firstChar & 0xFFFF) != 0))) return false; | |
1020 | } | |
1021 | } else { | |
1022 | if (idx == firstPlane) { | |
1023 | if (!__CFCSetIsBitmapEqualToRange((const UInt32 *)bitsBuf, firstChar & 0xFFFF, (firstPlane == lastPlane ? lastChar & 0xFFFF : 0xFFFF), false)) return false; | |
1024 | } else { | |
1025 | if (!__CFCSetIsBitmapEqualToRange((const UInt32 *)bitsBuf, (firstPlane == lastPlane ? firstChar & 0xFFFF : 0), lastChar & 0xFFFF, false)) return false; | |
1026 | } | |
1027 | } | |
1028 | } | |
1029 | } | |
1030 | return true; | |
1031 | } else { | |
9ce05555 | 1032 | uint8_t bitsBuf2[__kCFBitmapSize]; |
9ce05555 A |
1033 | uint8_t result; |
1034 | ||
bd5b749c | 1035 | result = CFUniCharGetBitmapForPlane(__CFCSetBuiltinType(builtinSet), 0, bitsBuf, (__CFCSetIsInverted(builtinSet) != 0)); |
9ce05555 A |
1036 | if (result == kCFUniCharBitmapFilled) { |
1037 | if (__CFCSetIsBitmap(nonBuiltinSet)) { | |
1038 | if (!__CFCSetIsEqualBitmap((const UInt32 *)bitsBuf, (const UInt32 *)__CFCSetBitmapBits(nonBuiltinSet))) return false; | |
1039 | } else { | |
9ce05555 A |
1040 | |
1041 | __CFCSetGetBitmap(nonBuiltinSet, bitsBuf2); | |
1042 | if (!__CFCSetIsEqualBitmap((const UInt32 *)bitsBuf, (const UInt32 *)bitsBuf2)) { | |
9ce05555 A |
1043 | return false; |
1044 | } | |
1045 | } | |
1046 | } else { | |
1047 | if (__CFCSetIsBitmap(nonBuiltinSet)) { | |
1048 | if (!__CFCSetIsEqualBitmap((result == kCFUniCharBitmapAll ? (const UInt32*)-1 : NULL), (const UInt32 *)__CFCSetBitmapBits(nonBuiltinSet))) return false; | |
1049 | } else { | |
1050 | __CFCSetGetBitmap(nonBuiltinSet, bitsBuf); | |
1051 | if (!__CFCSetIsEqualBitmap((result == kCFUniCharBitmapAll ? (const UInt32*)-1: NULL), (const UInt32 *)bitsBuf)) return false; | |
1052 | } | |
1053 | } | |
1054 | ||
1055 | isInvertStateIdentical = (__CFCSetIsInverted(builtinSet) == __CFCSetAnnexIsInverted(nonBuiltinSet) ? true : false); | |
1056 | ||
1057 | for (idx = 1;idx < MAX_ANNEX_PLANE;idx++) { | |
1058 | result = CFUniCharGetBitmapForPlane(__CFCSetBuiltinType(builtinSet), idx, bitsBuf, !isInvertStateIdentical); | |
1059 | subSet1 = __CFCSetGetAnnexPlaneCharacterSetNoAlloc(nonBuiltinSet, idx); | |
1060 | ||
1061 | if (result == kCFUniCharBitmapFilled) { | |
1062 | if (NULL == subSet1) { | |
9ce05555 A |
1063 | return false; |
1064 | } else if (__CFCSetIsBitmap(subSet1)) { | |
1065 | if (!__CFCSetIsEqualBitmap((const UInt32*)bitsBuf, (const UInt32*)__CFCSetBitmapBits(subSet1))) { | |
9ce05555 A |
1066 | return false; |
1067 | } | |
1068 | } else { | |
9ce05555 A |
1069 | |
1070 | __CFCSetGetBitmap(subSet1, bitsBuf2); | |
1071 | if (!__CFCSetIsEqualBitmap((const UInt32*)bitsBuf, (const UInt32*)bitsBuf2)) { | |
9ce05555 A |
1072 | return false; |
1073 | } | |
1074 | } | |
1075 | } else { | |
1076 | if (NULL == subSet1) { | |
1077 | if (result == kCFUniCharBitmapAll) { | |
9ce05555 A |
1078 | return false; |
1079 | } | |
1080 | } else if (__CFCSetIsBitmap(subSet1)) { | |
1081 | if (!__CFCSetIsEqualBitmap((result == kCFUniCharBitmapAll ? (const UInt32*)-1: NULL), (const UInt32*)__CFCSetBitmapBits(subSet1))) { | |
9ce05555 A |
1082 | return false; |
1083 | } | |
1084 | } else { | |
1085 | __CFCSetGetBitmap(subSet1, bitsBuf); | |
1086 | if (!__CFCSetIsEqualBitmap((result == kCFUniCharBitmapAll ? (const UInt32*)-1: NULL), (const UInt32*)bitsBuf)) { | |
9ce05555 A |
1087 | return false; |
1088 | } | |
1089 | } | |
1090 | } | |
1091 | } | |
9ce05555 A |
1092 | return true; |
1093 | } | |
1094 | } | |
1095 | ||
bd5b749c A |
1096 | if (__CFCSetIsRange((CFCharacterSetRef)cf1) || __CFCSetIsRange((CFCharacterSetRef)cf2)) { |
1097 | CFCharacterSetRef rangeSet = (__CFCSetIsRange((CFCharacterSetRef)cf1) ? (CFCharacterSetRef)cf1 : (CFCharacterSetRef)cf2); | |
1098 | CFCharacterSetRef nonRangeSet = (rangeSet == cf1 ? (CFCharacterSetRef)cf2 : (CFCharacterSetRef)cf1); | |
9ce05555 A |
1099 | UTF32Char firstChar = __CFCSetRangeFirstChar(rangeSet); |
1100 | UTF32Char lastChar = (firstChar + __CFCSetRangeLength(rangeSet) - 1); | |
1101 | uint8_t firstPlane = (firstChar >> 16) & 0xFF; | |
1102 | uint8_t lastPlane = (lastChar >> 16) & 0xFF; | |
1103 | Boolean isRangeSetInverted = __CFCSetIsInverted(rangeSet); | |
1104 | ||
1105 | if (__CFCSetIsBitmap(nonRangeSet)) { | |
1106 | bits = __CFCSetBitmapBits(nonRangeSet); | |
1107 | } else { | |
1108 | bits = bitsBuf; | |
1109 | __CFCSetGetBitmap(nonRangeSet, bitsBuf); | |
1110 | } | |
1111 | if (firstPlane == 0) { | |
1112 | if (!__CFCSetIsBitmapEqualToRange((const UInt32*)bits, firstChar, (lastPlane == 0 ? lastChar : 0xFFFF), isRangeSetInverted)) return false; | |
1113 | firstPlane = 1; | |
1114 | firstChar = 0; | |
1115 | } else { | |
1116 | if (!__CFCSetIsEqualBitmap((const UInt32*)bits, (isRangeSetInverted ? (const UInt32 *)-1 : NULL))) return false; | |
1117 | firstChar &= 0xFFFF; | |
1118 | } | |
1119 | ||
1120 | lastChar &= 0xFFFF; | |
1121 | ||
1122 | isAnnexInvertStateIdentical = (isRangeSetInverted == __CFCSetAnnexIsInverted(nonRangeSet) ? true : false); | |
1123 | ||
1124 | for (idx = 1;idx < MAX_ANNEX_PLANE;idx++) { | |
1125 | subSet1 = __CFCSetGetAnnexPlaneCharacterSetNoAlloc(nonRangeSet, idx); | |
1126 | if (NULL == subSet1) { | |
1127 | if (idx < firstPlane || idx > lastPlane) { | |
1128 | if (!isAnnexInvertStateIdentical) return false; | |
1129 | } else if (idx > firstPlane && idx < lastPlane) { | |
1130 | if (isAnnexInvertStateIdentical) return false; | |
1131 | } else if (idx == firstPlane) { | |
1132 | if (isAnnexInvertStateIdentical || firstChar || (idx == lastPlane && lastChar != 0xFFFF)) return false; | |
1133 | } else if (idx == lastPlane) { | |
1134 | if (isAnnexInvertStateIdentical || (idx == firstPlane && firstChar) || (lastChar != 0xFFFF)) return false; | |
1135 | } | |
1136 | } else { | |
1137 | if (__CFCSetIsBitmap(subSet1)) { | |
1138 | bits = __CFCSetBitmapBits(subSet1); | |
1139 | } else { | |
1140 | __CFCSetGetBitmap(subSet1, bitsBuf); | |
1141 | bits = bitsBuf; | |
1142 | } | |
1143 | ||
1144 | if (idx < firstPlane || idx > lastPlane) { | |
1145 | if (!__CFCSetIsEqualBitmap((const UInt32*)bits, (isAnnexInvertStateIdentical ? NULL : (const UInt32 *)-1))) return false; | |
1146 | } else if (idx > firstPlane && idx < lastPlane) { | |
1147 | if (!__CFCSetIsEqualBitmap((const UInt32*)bits, (isAnnexInvertStateIdentical ? (const UInt32 *)-1 : NULL))) return false; | |
1148 | } else if (idx == firstPlane) { | |
1149 | if (!__CFCSetIsBitmapEqualToRange((const UInt32*)bits, firstChar, (idx == lastPlane ? lastChar : 0xFFFF), !isAnnexInvertStateIdentical)) return false; | |
1150 | } else if (idx == lastPlane) { | |
1151 | if (!__CFCSetIsBitmapEqualToRange((const UInt32*)bits, (idx == firstPlane ? firstChar : 0), lastChar, !isAnnexInvertStateIdentical)) return false; | |
1152 | } | |
1153 | } | |
1154 | } | |
1155 | return true; | |
1156 | } | |
1157 | ||
bd5b749c A |
1158 | isBitmap1 = __CFCSetIsBitmap((CFCharacterSetRef)cf1); |
1159 | isBitmap2 = __CFCSetIsBitmap((CFCharacterSetRef)cf2); | |
9ce05555 A |
1160 | |
1161 | if (isBitmap1 && isBitmap2) { | |
bd5b749c | 1162 | if (!__CFCSetIsEqualBitmap((const UInt32 *)__CFCSetBitmapBits((CFCharacterSetRef)cf1), (const UInt32 *)__CFCSetBitmapBits((CFCharacterSetRef)cf2))) return false; |
9ce05555 | 1163 | } else if (!isBitmap1 && !isBitmap2) { |
9ce05555 | 1164 | uint8_t bitsBuf2[__kCFBitmapSize]; |
9ce05555 | 1165 | |
bd5b749c A |
1166 | __CFCSetGetBitmap((CFCharacterSetRef)cf1, bitsBuf); |
1167 | __CFCSetGetBitmap((CFCharacterSetRef)cf2, bitsBuf2); | |
9ce05555 A |
1168 | |
1169 | if (!__CFCSetIsEqualBitmap((const UInt32*)bitsBuf, (const UInt32*)bitsBuf2)) { | |
9ce05555 A |
1170 | return false; |
1171 | } | |
9ce05555 A |
1172 | } else { |
1173 | if (isBitmap2) { | |
bd5b749c | 1174 | CFCharacterSetRef tmp = (CFCharacterSetRef)cf2; |
9ce05555 A |
1175 | cf2 = cf1; |
1176 | cf1 = tmp; | |
1177 | } | |
1178 | ||
bd5b749c | 1179 | __CFCSetGetBitmap((CFCharacterSetRef)cf2, bitsBuf); |
9ce05555 | 1180 | |
bd5b749c | 1181 | if (!__CFCSetIsEqualBitmap((const UInt32 *)__CFCSetBitmapBits((CFCharacterSetRef)cf1), (const UInt32 *)bitsBuf)) return false; |
9ce05555 | 1182 | } |
bd5b749c | 1183 | return __CFCSetIsEqualAnnex((CFCharacterSetRef)cf1, (CFCharacterSetRef)cf2); |
9ce05555 A |
1184 | } |
1185 | ||
1186 | static CFHashCode __CFCharacterSetHash(CFTypeRef cf) { | |
bd5b749c A |
1187 | if (!__CFCSetHasHashValue((CFCharacterSetRef)cf)) { |
1188 | if (__CFCSetIsEmpty((CFCharacterSetRef)cf)) { | |
1189 | ((CFMutableCharacterSetRef)cf)->_hashValue = (__CFCSetIsInverted((CFCharacterSetRef)cf) ? ((UInt32)0xFFFFFFFF) : 0); | |
1190 | } else if (__CFCSetIsBitmap( (CFCharacterSetRef) cf )) { | |
1191 | ((CFMutableCharacterSetRef)cf)->_hashValue = CFHashBytes(__CFCSetBitmapBits((CFCharacterSetRef)cf), __kCFBitmapSize); | |
9ce05555 A |
1192 | } else { |
1193 | uint8_t bitsBuf[__kCFBitmapSize]; | |
bd5b749c | 1194 | __CFCSetGetBitmap((CFCharacterSetRef)cf, bitsBuf); |
9ce05555 A |
1195 | ((CFMutableCharacterSetRef)cf)->_hashValue = CFHashBytes(bitsBuf, __kCFBitmapSize); |
1196 | } | |
1197 | __CFCSetPutHasHashValue((CFMutableCharacterSetRef)cf, true); | |
1198 | } | |
1199 | return ((CFCharacterSetRef)cf)->_hashValue; | |
1200 | } | |
1201 | ||
1202 | static CFStringRef __CFCharacterSetCopyDescription(CFTypeRef cf) { | |
1203 | CFMutableStringRef string; | |
1204 | CFIndex idx; | |
1205 | CFIndex length; | |
1206 | ||
bd5b749c A |
1207 | if (__CFCSetIsEmpty((CFCharacterSetRef)cf)) { |
1208 | return (CFStringRef)(__CFCSetIsInverted((CFCharacterSetRef)cf) ? CFRetain(CFSTR("<CFCharacterSet All>")) : CFRetain(CFSTR("<CFCharacterSet Empty>"))); | |
9ce05555 A |
1209 | } |
1210 | ||
bd5b749c | 1211 | switch (__CFCSetClassType((CFCharacterSetRef)cf)) { |
9ce05555 | 1212 | case __kCFCharSetClassBuiltin: |
bd5b749c | 1213 | switch (__CFCSetBuiltinType((CFCharacterSetRef)cf)) { |
cf7d2af9 A |
1214 | case kCFCharacterSetControl: return (CFStringRef)CFRetain(CFSTR("<CFCharacterSet Predefined Control Set>")); |
1215 | case kCFCharacterSetWhitespace : return (CFStringRef)CFRetain(CFSTR("<CFCharacterSet Predefined Whitespace Set>")); | |
1216 | case kCFCharacterSetWhitespaceAndNewline: return (CFStringRef)CFRetain(CFSTR("<CFCharacterSet Predefined WhitespaceAndNewline Set>")); | |
1217 | case kCFCharacterSetDecimalDigit: return (CFStringRef)CFRetain(CFSTR("<CFCharacterSet Predefined DecimalDigit Set>")); | |
1218 | case kCFCharacterSetLetter: return (CFStringRef)CFRetain(CFSTR("<CFCharacterSet Predefined Letter Set>")); | |
1219 | case kCFCharacterSetLowercaseLetter: return (CFStringRef)CFRetain(CFSTR("<CFCharacterSet Predefined LowercaseLetter Set>")); | |
1220 | case kCFCharacterSetUppercaseLetter: return (CFStringRef)CFRetain(CFSTR("<CFCharacterSet Predefined UppercaseLetter Set>")); | |
1221 | case kCFCharacterSetNonBase: return (CFStringRef)CFRetain(CFSTR("<CFCharacterSet Predefined NonBase Set>")); | |
1222 | case kCFCharacterSetDecomposable: return (CFStringRef)CFRetain(CFSTR("<CFCharacterSet Predefined Decomposable Set>")); | |
1223 | case kCFCharacterSetAlphaNumeric: return (CFStringRef)CFRetain(CFSTR("<CFCharacterSet Predefined AlphaNumeric Set>")); | |
1224 | case kCFCharacterSetPunctuation: return (CFStringRef)CFRetain(CFSTR("<CFCharacterSet Predefined Punctuation Set>")); | |
1225 | case kCFCharacterSetIllegal: return (CFStringRef)CFRetain(CFSTR("<CFCharacterSet Predefined Illegal Set>")); | |
1226 | case kCFCharacterSetCapitalizedLetter: return (CFStringRef)CFRetain(CFSTR("<CFCharacterSet Predefined CapitalizedLetter Set>")); | |
1227 | case kCFCharacterSetSymbol: return (CFStringRef)CFRetain(CFSTR("<CFCharacterSet Predefined Symbol Set>")); | |
1228 | case kCFCharacterSetNewline: return (CFStringRef)CFRetain(CFSTR("<CFCharacterSet Predefined Newline Set>")); | |
9ce05555 A |
1229 | } |
1230 | break; | |
1231 | ||
1232 | case __kCFCharSetClassRange: | |
a48904a4 | 1233 | return CFStringCreateWithFormat(CFGetAllocator((CFCharacterSetRef)cf), NULL, CFSTR("<CFCharacterSet Range(%u, %ld)>"), (unsigned int)__CFCSetRangeFirstChar((CFCharacterSetRef)cf), (long)__CFCSetRangeLength((CFCharacterSetRef)cf)); |
9ce05555 | 1234 | |
cf7d2af9 A |
1235 | case __kCFCharSetClassString: { |
1236 | CFStringRef format = CFSTR("<CFCharacterSet Items("); | |
1237 | ||
bd5b749c | 1238 | length = __CFCSetStringLength((CFCharacterSetRef)cf); |
cf7d2af9 A |
1239 | string = CFStringCreateMutable(CFGetAllocator(cf), CFStringGetLength(format) + 7 * length + 2); // length of format + "U+XXXX "(7) * length + ")>"(2) |
1240 | CFStringAppend(string, format); | |
9ce05555 | 1241 | for (idx = 0;idx < length;idx++) { |
a48904a4 | 1242 | CFStringAppendFormat(string, NULL, CFSTR("%sU+%04X"), (idx > 0 ? " " : ""), (unsigned int)((__CFCSetStringBuffer((CFCharacterSetRef)cf))[idx])); |
9ce05555 A |
1243 | } |
1244 | CFStringAppend(string, CFSTR(")>")); | |
1245 | return string; | |
cf7d2af9 | 1246 | } |
9ce05555 A |
1247 | |
1248 | case __kCFCharSetClassBitmap: | |
1249 | case __kCFCharSetClassCompactBitmap: | |
bd5b749c | 1250 | return (CFStringRef)CFRetain(CFSTR("<CFCharacterSet Bitmap>")); // ??? Should generate description for 8k bitmap ? |
9ce05555 A |
1251 | } |
1252 | CFAssert1(0, __kCFLogAssertion, "%s: Internal inconsistency error: unknown character set type", __PRETTY_FUNCTION__); // We should never come here | |
1253 | return NULL; | |
1254 | } | |
1255 | ||
1256 | static void __CFCharacterSetDeallocate(CFTypeRef cf) { | |
1257 | CFAllocatorRef allocator = CFGetAllocator(cf); | |
1258 | ||
bd5b749c A |
1259 | if (__CFCSetIsBuiltin((CFCharacterSetRef)cf) && !__CFCSetIsMutable((CFCharacterSetRef)cf) && !__CFCSetIsInverted((CFCharacterSetRef)cf)) { |
1260 | CFCharacterSetRef sharedSet = CFCharacterSetGetPredefined(__CFCSetBuiltinType((CFCharacterSetRef)cf)); | |
9ce05555 | 1261 | if (sharedSet == cf) { // We're trying to dealloc the builtin set |
bd5b749c | 1262 | CFAssert1(0, __kCFLogAssertion, "%s: Trying to deallocate predefined set. The process is likely to crash.", __PRETTY_FUNCTION__); |
9ce05555 A |
1263 | return; // We never deallocate builtin set |
1264 | } | |
1265 | } | |
1266 | ||
bd5b749c A |
1267 | if (__CFCSetIsString((CFCharacterSetRef)cf) && __CFCSetStringBuffer((CFCharacterSetRef)cf)) CFAllocatorDeallocate(allocator, __CFCSetStringBuffer((CFCharacterSetRef)cf)); |
1268 | else if (__CFCSetIsBitmap((CFCharacterSetRef)cf) && __CFCSetBitmapBits((CFCharacterSetRef)cf)) CFAllocatorDeallocate(allocator, __CFCSetBitmapBits((CFCharacterSetRef)cf)); | |
1269 | else if (__CFCSetIsCompactBitmap((CFCharacterSetRef)cf) && __CFCSetCompactBitmapBits((CFCharacterSetRef)cf)) CFAllocatorDeallocate(allocator, __CFCSetCompactBitmapBits((CFCharacterSetRef)cf)); | |
1270 | __CFCSetDeallocateAnnexPlane((CFCharacterSetRef)cf); | |
9ce05555 A |
1271 | } |
1272 | ||
/* Runtime type ID for CFCharacterSet. Starts out as _kCFRuntimeNotATypeID and
   is assigned by __CFCharacterSetInitialize() when the class is registered. */
1273 | static CFTypeID __kCFCharacterSetTypeID = _kCFRuntimeNotATypeID; |
1274 | |
/* Runtime class record handed to _CFRuntimeRegisterClass().
   Slots are positional; per the CFRuntimeClass layout in CFRuntime.h they are
   presumably: version, className, init, copy, finalize, equal, hash,
   copyFormattingDesc, copyDebugDesc -- confirm against the header in use. */
1275 | static const CFRuntimeClass __CFCharacterSetClass = { |
1276 | 0, |
1277 | "CFCharacterSet", |
1278 | NULL, // init |
1279 | NULL, // copy |
1280 | __CFCharacterSetDeallocate, |
1281 | __CFCharacterSetEqual, |
1282 | __CFCharacterSetHash, |
1283 | NULL, // copyFormattingDesc (per CFRuntimeClass field order) |
1284 | __CFCharacterSetCopyDescription |
1285 | }; |
1286 | |
/* Debug switch: set to true by __CFCharacterSetInitialize() when the
   __CF_DEBUG_EXPANDED_SET environment variable starts with 'Y'.
   (The identifier's spelling is historical; it is kept as-is here.) */
1287 | static bool __CFCheckForExapendedSet = false; |
1288 | ||
a48904a4 | 1289 | CF_PRIVATE void __CFCharacterSetInitialize(void) { |
d7384798 A |
1290 | static dispatch_once_t initOnce; |
1291 | dispatch_once(&initOnce, ^{ | |
1292 | __kCFCharacterSetTypeID = _CFRuntimeRegisterClass(&__CFCharacterSetClass); // initOnce covered | |
1293 | const char *checkForExpandedSet = __CFgetenv("__CF_DEBUG_EXPANDED_SET"); | |
1294 | if (checkForExpandedSet && (*checkForExpandedSet == 'Y')) __CFCheckForExapendedSet = true; | |
1295 | __CFBuiltinSets = (CFCharacterSetRef *)CFAllocatorAllocate((CFAllocatorRef)CFRetain(__CFGetDefaultAllocator()), sizeof(CFCharacterSetRef) * __kCFLastBuiltinSetID, 0); | |
1296 | memset(__CFBuiltinSets, 0, sizeof(CFCharacterSetRef) * __kCFLastBuiltinSetID); | |
1297 | }); | |
9ce05555 A |
1298 | } |
1299 | ||
1300 | /* Public functions | |
1301 | */ | |
9ce05555 A |
1302 | |
/* Returns the runtime type ID stored in __kCFCharacterSetTypeID, i.e. the
   value produced by _CFRuntimeRegisterClass() in __CFCharacterSetInitialize()
   (or _kCFRuntimeNotATypeID if initialization has not run yet). */
1303 | CFTypeID CFCharacterSetGetTypeID(void) { |
1304 | return __kCFCharacterSetTypeID; |
1305 | } |
1306 | ||
1307 | /*** CharacterSet creation ***/ | |
1308 | /* Functions to create basic immutable characterset. | |
1309 | */ | |
1310 | CFCharacterSetRef CFCharacterSetGetPredefined(CFCharacterSetPredefinedSet theSetIdentifier) { | |
bd5b749c | 1311 | CFCharacterSetRef cset; |
9ce05555 A |
1312 | |
1313 | __CFCSetValidateBuiltinType(theSetIdentifier, __PRETTY_FUNCTION__); | |
1314 | ||
d7384798 | 1315 | OSSpinLockLock(&__CFCharacterSetLock); |
bd5b749c | 1316 | cset = ((NULL != __CFBuiltinSets) ? __CFBuiltinSets[theSetIdentifier - 1] : NULL); |
d7384798 | 1317 | OSSpinLockUnlock(&__CFCharacterSetLock); |
bd5b749c A |
1318 | |
1319 | if (NULL != cset) return cset; | |
9ce05555 A |
1320 | |
1321 | if (!(cset = __CFCSetGenericCreate(kCFAllocatorSystemDefault, __kCFCharSetClassBuiltin))) return NULL; | |
bd5b749c | 1322 | __CFCSetPutBuiltinType((CFMutableCharacterSetRef)cset, theSetIdentifier); |
9ce05555 | 1323 | |
d7384798 | 1324 | OSSpinLockLock(&__CFCharacterSetLock); |
9ce05555 | 1325 | __CFBuiltinSets[theSetIdentifier - 1] = cset; |
d7384798 | 1326 | OSSpinLockUnlock(&__CFCharacterSetLock); |
9ce05555 A |
1327 | |
1328 | return cset; | |
1329 | } | |
1330 | ||
1331 | CFCharacterSetRef CFCharacterSetCreateWithCharactersInRange(CFAllocatorRef allocator, CFRange theRange) { | |
1332 | CFMutableCharacterSetRef cset; | |
1333 | ||
1334 | __CFCSetValidateRange(theRange, __PRETTY_FUNCTION__); | |
1335 | ||
1336 | if (theRange.length) { | |
1337 | if (!(cset = __CFCSetGenericCreate(allocator, __kCFCharSetClassRange))) return NULL; | |
1338 | __CFCSetPutRangeFirstChar(cset, theRange.location); | |
1339 | __CFCSetPutRangeLength(cset, theRange.length); | |
1340 | } else { | |
1341 | if (!(cset = __CFCSetGenericCreate(allocator, __kCFCharSetClassBitmap))) return NULL; | |
1342 | __CFCSetPutBitmapBits(cset, NULL); | |
1343 | __CFCSetPutHasHashValue(cset, true); // _hashValue is 0 | |
1344 | } | |
1345 | ||
1346 | return cset; | |
1347 | } | |
1348 | ||
/* qsort() comparator ordering UniChar values ascending.
   Returns a negative, zero or positive value when *a is less than, equal to
   or greater than *b (the result is the plain difference of the two values).
*/
static int chcompar(const void *a, const void *b) {
    const UniChar lhs = *(const UniChar *)a;
    const UniChar rhs = *(const UniChar *)b;

    return (int)lhs - (int)rhs;
}
1352 | ||
1353 | CFCharacterSetRef CFCharacterSetCreateWithCharactersInString(CFAllocatorRef allocator, CFStringRef theString) { | |
1354 | CFIndex length; | |
1355 | ||
1356 | length = CFStringGetLength(theString); | |
1357 | if (length < __kCFStringCharSetMax) { | |
1358 | CFMutableCharacterSetRef cset; | |
1359 | ||
1360 | if (!(cset = __CFCSetGenericCreate(allocator, __kCFCharSetClassString))) return NULL; | |
bd5b749c | 1361 | __CFCSetPutStringBuffer(cset, (UniChar *)CFAllocatorAllocate(CFGetAllocator(cset), __kCFStringCharSetMax * sizeof(UniChar), 0)); |
9ce05555 A |
1362 | __CFCSetPutStringLength(cset, length); |
1363 | CFStringGetCharacters(theString, CFRangeMake(0, length), __CFCSetStringBuffer(cset)); | |
1364 | qsort(__CFCSetStringBuffer(cset), length, sizeof(UniChar), chcompar); | |
cf7d2af9 A |
1365 | |
1366 | if (0 == length) { | |
1367 | __CFCSetPutHasHashValue(cset, true); // _hashValue is 0 | |
1368 | } else if (length > 1) { // Check for surrogate | |
1369 | const UTF16Char *characters = __CFCSetStringBuffer(cset); | |
1370 | const UTF16Char *charactersLimit = characters + length; | |
1371 | ||
1372 | if ((*characters < 0xDC00UL) && (*(charactersLimit - 1) > 0xDBFFUL)) { // might have surrogate chars | |
1373 | while (characters < charactersLimit) { | |
1374 | if (CFStringIsSurrogateHighCharacter(*characters) || CFStringIsSurrogateLowCharacter(*characters)) { | |
1375 | CFRelease(cset); | |
1376 | cset = NULL; | |
1377 | break; | |
1378 | } | |
1379 | ++characters; | |
1380 | } | |
1381 | } | |
1382 | } | |
1383 | if (NULL != cset) return cset; | |
9ce05555 | 1384 | } |
cf7d2af9 A |
1385 | |
1386 | CFMutableCharacterSetRef mcset = CFCharacterSetCreateMutable(allocator); | |
1387 | CFCharacterSetAddCharactersInString(mcset, theString); | |
1388 | __CFCSetMakeCompact(mcset); | |
1389 | __CFCSetPutIsMutable(mcset, false); | |
1390 | return mcset; | |
9ce05555 A |
1391 | } |
1392 | ||
9ce05555 A |
1393 | CFCharacterSetRef CFCharacterSetCreateWithBitmapRepresentation(CFAllocatorRef allocator, CFDataRef theData) { |
1394 | CFMutableCharacterSetRef cset; | |
1395 | CFIndex length; | |
1396 | ||
1397 | if (!(cset = __CFCSetGenericCreate(allocator, __kCFCharSetClassBitmap))) return NULL; | |
1398 | ||
1399 | if (theData && (length = CFDataGetLength(theData)) > 0) { | |
1400 | uint8_t *bitmap; | |
1401 | uint8_t *cBitmap; | |
1402 | ||
1403 | if (length < __kCFBitmapSize) { | |
bd5b749c | 1404 | bitmap = (uint8_t *)CFAllocatorAllocate(allocator, __kCFBitmapSize, 0); |
9ce05555 A |
1405 | memmove(bitmap, CFDataGetBytePtr(theData), length); |
1406 | memset(bitmap + length, 0, __kCFBitmapSize - length); | |
1407 | ||
1408 | cBitmap = __CFCreateCompactBitmap(allocator, bitmap); | |
1409 | ||
1410 | if (cBitmap == NULL) { | |
1411 | __CFCSetPutBitmapBits(cset, bitmap); | |
1412 | } else { | |
1413 | CFAllocatorDeallocate(allocator, bitmap); | |
1414 | __CFCSetPutCompactBitmapBits(cset, cBitmap); | |
1415 | __CFCSetPutClassType(cset, __kCFCharSetClassCompactBitmap); | |
1416 | } | |
1417 | } else { | |
1418 | cBitmap = __CFCreateCompactBitmap(allocator, CFDataGetBytePtr(theData)); | |
1419 | ||
1420 | if (cBitmap == NULL) { | |
bd5b749c | 1421 | bitmap = (uint8_t *)CFAllocatorAllocate(allocator, __kCFBitmapSize, 0); |
9ce05555 A |
1422 | memmove(bitmap, CFDataGetBytePtr(theData), __kCFBitmapSize); |
1423 | ||
1424 | __CFCSetPutBitmapBits(cset, bitmap); | |
1425 | } else { | |
1426 | __CFCSetPutCompactBitmapBits(cset, cBitmap); | |
1427 | __CFCSetPutClassType(cset, __kCFCharSetClassCompactBitmap); | |
1428 | } | |
1429 | ||
1430 | if (length > __kCFBitmapSize) { | |
1431 | CFMutableCharacterSetRef annexSet; | |
bd5b749c | 1432 | const uint8_t *bytes = CFDataGetBytePtr(theData) + __kCFBitmapSize; |
9ce05555 A |
1433 | |
1434 | length -= __kCFBitmapSize; | |
1435 | ||
1436 | while (length > 1) { | |
1437 | annexSet = (CFMutableCharacterSetRef)__CFCSetGetAnnexPlaneCharacterSet(cset, *(bytes++)); | |
1438 | --length; // Decrement the plane no byte | |
1439 | ||
1440 | if (length < __kCFBitmapSize) { | |
bd5b749c | 1441 | bitmap = (uint8_t *)CFAllocatorAllocate(allocator, __kCFBitmapSize, 0); |
9ce05555 A |
1442 | memmove(bitmap, bytes, length); |
1443 | memset(bitmap + length, 0, __kCFBitmapSize - length); | |
1444 | ||
1445 | cBitmap = __CFCreateCompactBitmap(allocator, bitmap); | |
1446 | ||
1447 | if (cBitmap == NULL) { | |
1448 | __CFCSetPutBitmapBits(annexSet, bitmap); | |
1449 | } else { | |
1450 | CFAllocatorDeallocate(allocator, bitmap); | |
1451 | __CFCSetPutCompactBitmapBits(annexSet, cBitmap); | |
1452 | __CFCSetPutClassType(annexSet, __kCFCharSetClassCompactBitmap); | |
1453 | } | |
1454 | } else { | |
1455 | cBitmap = __CFCreateCompactBitmap(allocator, bytes); | |
1456 | ||
1457 | if (cBitmap == NULL) { | |
bd5b749c | 1458 | bitmap = (uint8_t *)CFAllocatorAllocate(allocator, __kCFBitmapSize, 0); |
9ce05555 A |
1459 | memmove(bitmap, bytes, __kCFBitmapSize); |
1460 | ||
1461 | __CFCSetPutBitmapBits(annexSet, bitmap); | |
1462 | } else { | |
1463 | __CFCSetPutCompactBitmapBits(annexSet, cBitmap); | |
1464 | __CFCSetPutClassType(annexSet, __kCFCharSetClassCompactBitmap); | |
1465 | } | |
1466 | } | |
1467 | length -= __kCFBitmapSize; | |
1468 | bytes += __kCFBitmapSize; | |
1469 | } | |
1470 | } | |
1471 | } | |
1472 | } else { | |
1473 | __CFCSetPutBitmapBits(cset, NULL); | |
1474 | __CFCSetPutHasHashValue(cset, true); // Hash value is 0 | |
1475 | } | |
1476 | ||
1477 | return cset; | |
1478 | } | |
1479 | ||
1480 | CFCharacterSetRef CFCharacterSetCreateInvertedSet(CFAllocatorRef alloc, CFCharacterSetRef theSet) { | |
1481 | CFMutableCharacterSetRef cset; | |
1482 | ||
856091c5 | 1483 | CF_OBJC_FUNCDISPATCHV(__kCFCharacterSetTypeID, CFCharacterSetRef , (NSCharacterSet *)theSet, invertedSet); |
9ce05555 A |
1484 | |
1485 | cset = CFCharacterSetCreateMutableCopy(alloc, theSet); | |
1486 | CFCharacterSetInvert(cset); | |
1487 | __CFCSetPutIsMutable(cset, false); | |
1488 | ||
1489 | return cset; | |
1490 | } | |
1491 | ||
1492 | /* Functions to create mutable characterset. | |
1493 | */ | |
1494 | CFMutableCharacterSetRef CFCharacterSetCreateMutable(CFAllocatorRef allocator) { | |
1495 | CFMutableCharacterSetRef cset; | |
1496 | ||
1497 | if (!(cset = __CFCSetGenericCreate(allocator, __kCFCharSetClassBitmap| __kCFCharSetIsMutable))) return NULL; | |
1498 | __CFCSetPutBitmapBits(cset, NULL); | |
1499 | __CFCSetPutHasHashValue(cset, true); // Hash value is 0 | |
1500 | ||
1501 | return cset; | |
1502 | } | |
1503 | ||
cf7d2af9 | 1504 | static CFMutableCharacterSetRef __CFCharacterSetCreateCopy(CFAllocatorRef alloc, CFCharacterSetRef theSet, bool isMutable) { |
9ce05555 A |
1505 | CFMutableCharacterSetRef cset; |
1506 | ||
856091c5 | 1507 | CF_OBJC_FUNCDISPATCHV(__kCFCharacterSetTypeID, CFMutableCharacterSetRef , (NSCharacterSet *)theSet, mutableCopy); |
9ce05555 A |
1508 | |
1509 | __CFGenericValidateType(theSet, __kCFCharacterSetTypeID); | |
1510 | ||
1511 | if (!isMutable && !__CFCSetIsMutable(theSet)) { | |
1512 | return (CFMutableCharacterSetRef)CFRetain(theSet); | |
1513 | } | |
1514 | ||
1515 | cset = CFCharacterSetCreateMutable(alloc); | |
1516 | ||
1517 | __CFCSetPutClassType(cset, __CFCSetClassType(theSet)); | |
1518 | __CFCSetPutHasHashValue(cset, __CFCSetHasHashValue(theSet)); | |
1519 | __CFCSetPutIsInverted(cset, __CFCSetIsInverted(theSet)); | |
1520 | cset->_hashValue = theSet->_hashValue; | |
1521 | ||
1522 | switch (__CFCSetClassType(theSet)) { | |
1523 | case __kCFCharSetClassBuiltin: | |
1524 | __CFCSetPutBuiltinType(cset, __CFCSetBuiltinType(theSet)); | |
1525 | break; | |
1526 | ||
1527 | case __kCFCharSetClassRange: | |
1528 | __CFCSetPutRangeFirstChar(cset, __CFCSetRangeFirstChar(theSet)); | |
1529 | __CFCSetPutRangeLength(cset, __CFCSetRangeLength(theSet)); | |
1530 | break; | |
1531 | ||
1532 | case __kCFCharSetClassString: | |
bd5b749c A |
1533 | __CFCSetPutStringBuffer(cset, (UniChar *)CFAllocatorAllocate(alloc, __kCFStringCharSetMax * sizeof(UniChar), 0)); |
1534 | ||
9ce05555 A |
1535 | __CFCSetPutStringLength(cset, __CFCSetStringLength(theSet)); |
1536 | memmove(__CFCSetStringBuffer(cset), __CFCSetStringBuffer(theSet), __CFCSetStringLength(theSet) * sizeof(UniChar)); | |
1537 | break; | |
1538 | ||
1539 | case __kCFCharSetClassBitmap: | |
1540 | if (__CFCSetBitmapBits(theSet)) { | |
1541 | uint8_t * bitmap = (isMutable ? NULL : __CFCreateCompactBitmap(alloc, __CFCSetBitmapBits(theSet))); | |
1542 | ||
1543 | if (bitmap == NULL) { | |
bd5b749c | 1544 | bitmap = (uint8_t *)CFAllocatorAllocate(alloc, sizeof(uint8_t) * __kCFBitmapSize, 0); |
9ce05555 A |
1545 | memmove(bitmap, __CFCSetBitmapBits(theSet), __kCFBitmapSize); |
1546 | __CFCSetPutBitmapBits(cset, bitmap); | |
1547 | } else { | |
1548 | __CFCSetPutCompactBitmapBits(cset, bitmap); | |
1549 | __CFCSetPutClassType(cset, __kCFCharSetClassCompactBitmap); | |
1550 | } | |
1551 | } else { | |
1552 | __CFCSetPutBitmapBits(cset, NULL); | |
1553 | } | |
1554 | break; | |
1555 | ||
1556 | case __kCFCharSetClassCompactBitmap: { | |
1557 | const uint8_t *compactBitmap = __CFCSetCompactBitmapBits(theSet); | |
1558 | ||
1559 | if (compactBitmap) { | |
1560 | uint32_t size = __CFCSetGetCompactBitmapSize(compactBitmap); | |
bd5b749c | 1561 | uint8_t *newBitmap = (uint8_t *)CFAllocatorAllocate(alloc, size, 0); |
9ce05555 A |
1562 | |
1563 | memmove(newBitmap, compactBitmap, size); | |
1564 | __CFCSetPutCompactBitmapBits(cset, newBitmap); | |
1565 | } | |
1566 | } | |
1567 | break; | |
1568 | ||
1569 | default: | |
1570 | CFAssert1(0, __kCFLogAssertion, "%s: Internal inconsistency error: unknown character set type", __PRETTY_FUNCTION__); // We should never come here | |
1571 | } | |
1572 | if (__CFCSetHasNonBMPPlane(theSet)) { | |
1573 | CFMutableCharacterSetRef annexPlane; | |
1574 | int idx; | |
1575 | ||
1576 | for (idx = 1;idx <= MAX_ANNEX_PLANE;idx++) { | |
1577 | if ((annexPlane = (CFMutableCharacterSetRef)__CFCSetGetAnnexPlaneCharacterSetNoAlloc(theSet, idx))) { | |
1578 | annexPlane = __CFCharacterSetCreateCopy(alloc, annexPlane, isMutable); | |
1579 | __CFCSetPutCharacterSetToAnnexPlane(cset, annexPlane, idx); | |
1580 | CFRelease(annexPlane); | |
1581 | } | |
1582 | } | |
1583 | __CFCSetAnnexSetIsInverted(cset, __CFCSetAnnexIsInverted(theSet)); | |
1584 | } else if (__CFCSetAnnexIsInverted(theSet)) { | |
9ce05555 A |
1585 | __CFCSetAnnexSetIsInverted(cset, true); |
1586 | } | |
1587 | ||
1588 | return cset; | |
1589 | } | |
1590 | ||
/* Immutable-copy entry point: forwards to __CFCharacterSetCreateCopy() with
   isMutable == false. For a source that is already immutable that helper
   returns the retained original rather than a new instance. */
1591 | CFCharacterSetRef CFCharacterSetCreateCopy(CFAllocatorRef alloc, CFCharacterSetRef theSet) { |
1592 | return __CFCharacterSetCreateCopy(alloc, theSet, false); |
1593 | } |
1594 | ||
/* Mutable-copy entry point: forwards to __CFCharacterSetCreateCopy() with
   isMutable == true, which always builds a new instance for CF-native sets. */
1595 | CFMutableCharacterSetRef CFCharacterSetCreateMutableCopy(CFAllocatorRef alloc, CFCharacterSetRef theSet) { |
1596 | return __CFCharacterSetCreateCopy(alloc, theSet, true); |
1597 | } |
1598 | ||
1599 | /*** Basic accessors ***/ | |
1600 | Boolean CFCharacterSetIsCharacterMember(CFCharacterSetRef theSet, UniChar theChar) { | |
bd5b749c A |
1601 | CFIndex length; |
1602 | Boolean isInverted; | |
1603 | Boolean result = false; | |
1604 | ||
856091c5 | 1605 | CF_OBJC_FUNCDISPATCHV(__kCFCharacterSetTypeID, Boolean, (NSCharacterSet *)theSet, longCharacterIsMember:(UTF32Char)theChar); |
bd5b749c A |
1606 | |
1607 | __CFGenericValidateType(theSet, __kCFCharacterSetTypeID); | |
1608 | ||
1609 | isInverted = __CFCSetIsInverted(theSet); | |
1610 | ||
1611 | switch (__CFCSetClassType(theSet)) { | |
1612 | case __kCFCharSetClassBuiltin: | |
1613 | result = (CFUniCharIsMemberOf(theChar, __CFCSetBuiltinType(theSet)) ? !isInverted : isInverted); | |
1614 | break; | |
1615 | ||
1616 | case __kCFCharSetClassRange: | |
1617 | length = __CFCSetRangeLength(theSet); | |
1618 | result = (length && __CFCSetRangeFirstChar(theSet) <= theChar && theChar < __CFCSetRangeFirstChar(theSet) + length ? !isInverted : isInverted); | |
1619 | break; | |
1620 | ||
1621 | case __kCFCharSetClassString: | |
1622 | result = ((length = __CFCSetStringLength(theSet)) ? (__CFCSetBsearchUniChar(__CFCSetStringBuffer(theSet), length, theChar) ? !isInverted : isInverted) : isInverted); | |
1623 | break; | |
1624 | ||
1625 | case __kCFCharSetClassBitmap: | |
1626 | result = (__CFCSetCompactBitmapBits(theSet) ? (__CFCSetIsMemberBitmap(__CFCSetBitmapBits(theSet), theChar) ? true : false) : isInverted); | |
1627 | break; | |
1628 | ||
1629 | case __kCFCharSetClassCompactBitmap: | |
1630 | result = (__CFCSetCompactBitmapBits(theSet) ? (__CFCSetIsMemberInCompactBitmap(__CFCSetCompactBitmapBits(theSet), theChar) ? true : false) : isInverted); | |
1631 | break; | |
1632 | ||
1633 | default: | |
1634 | CFAssert1(0, __kCFLogAssertion, "%s: Internal inconsistency error: unknown character set type", __PRETTY_FUNCTION__); // We should never come here | |
1635 | break; | |
1636 | } | |
1637 | ||
1638 | return result; | |
9ce05555 A |
1639 | } |
1640 | ||
1641 | Boolean CFCharacterSetIsLongCharacterMember(CFCharacterSetRef theSet, UTF32Char theChar) { | |
1642 | CFIndex length; | |
1643 | UInt32 plane = (theChar >> 16); | |
1644 | Boolean isAnnexInverted = false; | |
1645 | Boolean isInverted; | |
1646 | Boolean result = false; | |
1647 | ||
856091c5 | 1648 | CF_OBJC_FUNCDISPATCHV(__kCFCharacterSetTypeID, Boolean, (NSCharacterSet *)theSet, longCharacterIsMember:(UTF32Char)theChar); |
9ce05555 A |
1649 | |
1650 | __CFGenericValidateType(theSet, __kCFCharacterSetTypeID); | |
1651 | ||
1652 | if (plane) { | |
1653 | CFCharacterSetRef annexPlane; | |
1654 | ||
1655 | if (__CFCSetIsBuiltin(theSet)) { | |
1656 | isInverted = __CFCSetIsInverted(theSet); | |
1657 | return (CFUniCharIsMemberOf(theChar, __CFCSetBuiltinType(theSet)) ? !isInverted : isInverted); | |
1658 | } | |
1659 | ||
1660 | isAnnexInverted = __CFCSetAnnexIsInverted(theSet); | |
1661 | ||
1662 | if ((annexPlane = __CFCSetGetAnnexPlaneCharacterSetNoAlloc(theSet, plane)) == NULL) { | |
1663 | if (!__CFCSetHasNonBMPPlane(theSet) && __CFCSetIsRange(theSet)) { | |
1664 | isInverted = __CFCSetIsInverted(theSet); | |
1665 | length = __CFCSetRangeLength(theSet); | |
1666 | return (length && __CFCSetRangeFirstChar(theSet) <= theChar && theChar < __CFCSetRangeFirstChar(theSet) + length ? !isInverted : isInverted); | |
1667 | } else { | |
1668 | return (isAnnexInverted ? true : false); | |
1669 | } | |
1670 | } else { | |
1671 | theSet = annexPlane; | |
1672 | theChar &= 0xFFFF; | |
1673 | } | |
1674 | } | |
1675 | ||
1676 | isInverted = __CFCSetIsInverted(theSet); | |
1677 | ||
1678 | switch (__CFCSetClassType(theSet)) { | |
1679 | case __kCFCharSetClassBuiltin: | |
1680 | result = (CFUniCharIsMemberOf(theChar, __CFCSetBuiltinType(theSet)) ? !isInverted : isInverted); | |
1681 | break; | |
1682 | ||
1683 | case __kCFCharSetClassRange: | |
1684 | length = __CFCSetRangeLength(theSet); | |
1685 | result = (length && __CFCSetRangeFirstChar(theSet) <= theChar && theChar < __CFCSetRangeFirstChar(theSet) + length ? !isInverted : isInverted); | |
1686 | break; | |
1687 | ||
1688 | case __kCFCharSetClassString: | |
1689 | result = ((length = __CFCSetStringLength(theSet)) ? (__CFCSetBsearchUniChar(__CFCSetStringBuffer(theSet), length, theChar) ? !isInverted : isInverted) : isInverted); | |
1690 | break; | |
1691 | ||
1692 | case __kCFCharSetClassBitmap: | |
1693 | result = (__CFCSetCompactBitmapBits(theSet) ? (__CFCSetIsMemberBitmap(__CFCSetBitmapBits(theSet), theChar) ? true : false) : isInverted); | |
1694 | break; | |
1695 | ||
1696 | case __kCFCharSetClassCompactBitmap: | |
1697 | result = (__CFCSetCompactBitmapBits(theSet) ? (__CFCSetIsMemberInCompactBitmap(__CFCSetCompactBitmapBits(theSet), theChar) ? true : false) : isInverted); | |
1698 | break; | |
1699 | ||
1700 | default: | |
1701 | CFAssert1(0, __kCFLogAssertion, "%s: Internal inconsistency error: unknown character set type", __PRETTY_FUNCTION__); // We should never come here | |
1702 | return false; // To make compiler happy | |
1703 | } | |
1704 | ||
1705 | return (result ? !isAnnexInverted : isAnnexInverted); | |
1706 | } | |
1707 | ||
/* Membership test for a character given as a UTF-16 surrogate pair: the pair
   is combined with CFCharacterSetGetLongCharacterForSurrogatePair() and the
   result is passed to CFCharacterSetIsLongCharacterMember(). */
1708 | Boolean CFCharacterSetIsSurrogatePairMember(CFCharacterSetRef theSet, UniChar surrogateHigh, UniChar surrogateLow) { |
1709 | return CFCharacterSetIsLongCharacterMember(theSet, CFCharacterSetGetLongCharacterForSurrogatePair(surrogateHigh, surrogateLow)); |
1710 | } |
1711 | ||
1712 | ||
/* Asks a bridged character set object for its _expandedCFCharacterSet via the
   CF_OBJC_FUNCDISPATCHV macro; returns NULL when the macro does not return.
   NOTE(review): presumably the macro returns the message result only when
   characterSet is an Objective-C object -- confirm against its definition. */
bd5b749c | 1713 | static inline CFCharacterSetRef __CFCharacterSetGetExpandedSetForNSCharacterSet(const void *characterSet) { |
856091c5 | 1714 | CF_OBJC_FUNCDISPATCHV(__kCFCharacterSetTypeID, CFCharacterSetRef , (NSCharacterSet *)characterSet, _expandedCFCharacterSet); |
9ce05555 A |
1715 | return NULL; |
1716 | } |
1717 | ||
/* Returns whether theSet contains every member of theOtherSet.
   When both arguments are CF-native sets (or bridged objects that can supply
   an expanded CF set), several representation-specific shortcuts are tried:
   empty sets, identical builtin sets, range-vs-range comparison, and finally
   a bitmap comparison of the BMP followed by each annex plane.
   Any case the shortcuts do not decide falls through to the generic path at
   the bottom: intersect a mutable copy of theSet with theOtherSet and check
   that the intersection equals theOtherSet. */
1718 | Boolean CFCharacterSetIsSupersetOfSet(CFCharacterSetRef theSet, CFCharacterSetRef theOtherSet) { |
1719 | CFMutableCharacterSetRef copy; |
1720 | CFCharacterSetRef expandedSet = NULL; |
1721 | CFCharacterSetRef expandedOtherSet = NULL; |
1722 | Boolean result; |
1723 | |
// Fast paths are only attempted when each argument is either not an ObjC object or yields an expanded CF set.
1724 | if ((!CF_IS_OBJC(__kCFCharacterSetTypeID, theSet) || (expandedSet = __CFCharacterSetGetExpandedSetForNSCharacterSet(theSet))) && (!CF_IS_OBJC(__kCFCharacterSetTypeID, theOtherSet) || (expandedOtherSet = __CFCharacterSetGetExpandedSetForNSCharacterSet(theOtherSet)))) { // Really CF, we can do some trick here |
1725 | if (expandedSet) theSet = expandedSet; |
1726 | if (expandedOtherSet) theOtherSet = expandedOtherSet; |
1727 | |
1728 | __CFGenericValidateType(theSet, __kCFCharacterSetTypeID); |
1729 | __CFGenericValidateType(theOtherSet, __kCFCharacterSetTypeID); |
1730 | |
// Empty-set shortcuts. An empty, non-inverted theSet paired with an empty, non-inverted theOtherSet
// is not decided here and drops to the generic path below.
1731 | if (__CFCSetIsEmpty(theSet)) { |
1732 | if (__CFCSetIsInverted(theSet)) { |
1733 | return TRUE; // Inverted empty set covers all range |
1734 | } else if (!__CFCSetIsEmpty(theOtherSet) || __CFCSetIsInverted(theOtherSet)) { |
1735 | return FALSE; |
1736 | } |
1737 | } else if (__CFCSetIsEmpty(theOtherSet) && !__CFCSetIsInverted(theOtherSet)) { |
1738 | return TRUE; |
1739 | } else { |
// Builtin: only "same builtin type, neither inverted" is answered here; anything else uses the generic path.
1740 | if (__CFCSetIsBuiltin(theSet) || __CFCSetIsBuiltin(theOtherSet)) { |
1741 | if (__CFCSetClassType(theSet) == __CFCSetClassType(theOtherSet) && __CFCSetBuiltinType(theSet) == __CFCSetBuiltinType(theOtherSet) && !__CFCSetIsInverted(theSet) && !__CFCSetIsInverted(theOtherSet)) return TRUE; |
// Range: decided arithmetically only when both sets are range sets; one sub-case per combination of inverted flags.
1742 | } else if (__CFCSetIsRange(theSet) || __CFCSetIsRange(theOtherSet)) { |
1743 | if (__CFCSetClassType(theSet) == __CFCSetClassType(theOtherSet)) { |
1744 | if (__CFCSetIsInverted(theSet)) { |
1745 | if (__CFCSetIsInverted(theOtherSet)) { |
1746 | return (__CFCSetRangeFirstChar(theOtherSet) > __CFCSetRangeFirstChar(theSet) || (__CFCSetRangeFirstChar(theSet) + __CFCSetRangeLength(theSet)) > (__CFCSetRangeFirstChar(theOtherSet) + __CFCSetRangeLength(theOtherSet)) ? FALSE : TRUE); |
1747 | } else { |
1748 | return ((__CFCSetRangeFirstChar(theOtherSet) + __CFCSetRangeLength(theOtherSet)) <= __CFCSetRangeFirstChar(theSet) || (__CFCSetRangeFirstChar(theSet) + __CFCSetRangeLength(theSet)) <= __CFCSetRangeFirstChar(theOtherSet) ? TRUE : FALSE); |
1749 | } |
1750 | } else { |
1751 | if (__CFCSetIsInverted(theOtherSet)) { |
1752 | return ((__CFCSetRangeFirstChar(theSet) == 0 && __CFCSetRangeLength(theSet) == 0x110000) || (__CFCSetRangeFirstChar(theOtherSet) == 0 && (UInt32)__CFCSetRangeLength(theOtherSet) <= __CFCSetRangeFirstChar(theSet)) || ((__CFCSetRangeFirstChar(theSet) + __CFCSetRangeLength(theSet)) <= __CFCSetRangeFirstChar(theOtherSet) && (__CFCSetRangeFirstChar(theOtherSet) + __CFCSetRangeLength(theOtherSet)) == 0x110000) ? TRUE : FALSE); |
1753 | } else { |
1754 | return (__CFCSetRangeFirstChar(theOtherSet) < __CFCSetRangeFirstChar(theSet) || (__CFCSetRangeFirstChar(theSet) + __CFCSetRangeLength(theSet)) < (__CFCSetRangeFirstChar(theOtherSet) + __CFCSetRangeLength(theOtherSet)) ? FALSE : TRUE); |
1755 | } |
1756 | } |
1757 | } |
// Everything else: expand both sets to bitmaps and compare the BMP first, then each annex plane.
1758 | } else { |
1759 | UInt32 theSetAnnexMask = __CFCSetAnnexValidEntriesBitmap(theSet); |
1760 | UInt32 theOtherSetAnnexMask = __CFCSetAnnexValidEntriesBitmap(theOtherSet); |
1761 | Boolean isTheSetAnnexInverted = __CFCSetAnnexIsInverted(theSet); |
1762 | Boolean isTheOtherSetAnnexInverted = __CFCSetAnnexIsInverted(theOtherSet); |
1763 | uint8_t theSetBuffer[__kCFBitmapSize]; |
1764 | uint8_t theOtherSetBuffer[__kCFBitmapSize]; |
1765 | |
1766 | // We mask plane 1 to plane 16 |
cf7d2af9 A |
1767 | if (isTheSetAnnexInverted) theSetAnnexMask = (~theSetAnnexMask) & (0xFFFF << 1); |
1768 | if (isTheOtherSetAnnexInverted) theOtherSetAnnexMask = (~theOtherSetAnnexMask) & (0xFFFF << 1); |
9ce05555 A |
1769 | |
1770 | __CFCSetGetBitmap(theSet, theSetBuffer); |
1771 | __CFCSetGetBitmap(theOtherSet, theOtherSetBuffer); |
1772 | |
1773 | if (!__CFCSetIsBitmapSupersetOfBitmap((const UInt32 *)theSetBuffer, (const UInt32 *)theOtherSetBuffer, FALSE, FALSE)) return FALSE; |
1774 | |
1775 | if (theOtherSetAnnexMask) { |
1776 | CFCharacterSetRef theSetAnnex; |
1777 | CFCharacterSetRef theOtherSetAnnex; |
1778 | uint32_t idx; |
1779 | |
// Every plane flagged in theOtherSet's (possibly complemented) mask must also be flagged in theSet's mask.
1780 | if ((theSetAnnexMask & theOtherSetAnnexMask) != theOtherSetAnnexMask) return FALSE; |
1781 | |
1782 | for (idx = 1;idx <= 16;idx++) { |
1783 | theSetAnnex = __CFCSetGetAnnexPlaneCharacterSetNoAlloc(theSet, idx); |
1784 | if (NULL == theSetAnnex) continue; // This case is already handled by the mask above |
1785 | |
1786 | theOtherSetAnnex = __CFCSetGetAnnexPlaneCharacterSetNoAlloc(theOtherSet, idx); |
1787 | |
1788 | if (NULL == theOtherSetAnnex) { |
1789 | if (isTheOtherSetAnnexInverted) { |
1790 | __CFCSetGetBitmap(theSetAnnex, theSetBuffer); |
1791 | if (!__CFCSetIsEqualBitmap((const UInt32 *)theSetBuffer, (isTheSetAnnexInverted ? NULL : (const UInt32 *)-1))) return FALSE; |
1792 | } |
1793 | } else { |
1794 | __CFCSetGetBitmap(theSetAnnex, theSetBuffer); |
1795 | __CFCSetGetBitmap(theOtherSetAnnex, theOtherSetBuffer); |
1796 | if (!__CFCSetIsBitmapSupersetOfBitmap((const UInt32 *)theSetBuffer, (const UInt32 *)theOtherSetBuffer, isTheSetAnnexInverted, isTheOtherSetAnnexInverted)) return FALSE; |
1797 | } |
1798 | } |
1799 | } |
1800 | |
1801 | return TRUE; |
1802 | } |
1803 | } |
1804 | } |
1805 | |
// Generic path: theSet is a superset exactly when (theSet intersected with theOtherSet) equals theOtherSet.
bd5b749c | 1806 | copy = CFCharacterSetCreateMutableCopy(kCFAllocatorSystemDefault, theSet); |
9ce05555 A |
1807 | CFCharacterSetIntersect(copy, theOtherSet); |
1808 | result = __CFCharacterSetEqual(copy, theOtherSet); |
1809 | CFRelease(copy); |
1810 | |
1811 | return result; |
1812 | } |
1813 | ||
1814 | Boolean CFCharacterSetHasMemberInPlane(CFCharacterSetRef theSet, CFIndex thePlane) { | |
1815 | Boolean isInverted = __CFCSetIsInverted(theSet); | |
1816 | ||
856091c5 | 1817 | CF_OBJC_FUNCDISPATCHV(__kCFCharacterSetTypeID, Boolean, (NSCharacterSet *)theSet, hasMemberInPlane:(uint8_t)thePlane); |
9ce05555 A |
1818 | |
1819 | if (__CFCSetIsEmpty(theSet)) { | |
1820 | return (isInverted ? TRUE : FALSE); | |
1821 | } else if (__CFCSetIsBuiltin(theSet)) { | |
1822 | CFCharacterSetPredefinedSet type = __CFCSetBuiltinType(theSet); | |
1823 | ||
1824 | if (type == kCFCharacterSetControl) { | |
1825 | if (isInverted || (thePlane == 14)) { | |
1826 | return TRUE; // There is no plane that covers all values || Plane 14 has language tags | |
1827 | } else { | |
1828 | return (CFUniCharGetBitmapPtrForPlane(type, thePlane) ? TRUE : FALSE); | |
1829 | } | |
bd5b749c | 1830 | } else if ((type < kCFCharacterSetDecimalDigit) || (type == kCFCharacterSetNewline)) { |
9ce05555 A |
1831 | return (thePlane && !isInverted ? FALSE : TRUE); |
1832 | } else if (__CFCSetBuiltinType(theSet) == kCFCharacterSetIllegal) { | |
1833 | return (isInverted ? (thePlane < 3 || thePlane > 13 ? TRUE : FALSE) : TRUE); // This is according to Unicode 3.1 | |
1834 | } else { | |
1835 | if (isInverted) { | |
1836 | return TRUE; // There is no plane that covers all values | |
1837 | } else { | |
1838 | return (CFUniCharGetBitmapPtrForPlane(type, thePlane) ? TRUE : FALSE); | |
1839 | } | |
1840 | } | |
1841 | } else if (__CFCSetIsRange(theSet)) { | |
1842 | UTF32Char firstChar = __CFCSetRangeFirstChar(theSet); | |
1843 | UTF32Char lastChar = (firstChar + __CFCSetRangeLength(theSet) - 1); | |
1844 | CFIndex firstPlane = firstChar >> 16; | |
1845 | CFIndex lastPlane = lastChar >> 16; | |
1846 | ||
1847 | if (isInverted) { | |
1848 | if (thePlane < firstPlane || thePlane > lastPlane) { | |
1849 | return TRUE; | |
1850 | } else if (thePlane > firstPlane && thePlane < lastPlane) { | |
1851 | return FALSE; | |
1852 | } else { | |
1853 | firstChar &= 0xFFFF; | |
1854 | lastChar &= 0xFFFF; | |
1855 | if (thePlane == firstPlane) { | |
1856 | return (firstChar || (firstPlane == lastPlane && lastChar != 0xFFFF) ? TRUE : FALSE); | |
1857 | } else { | |
1858 | return (lastChar != 0xFFFF || (firstPlane == lastPlane && firstChar) ? TRUE : FALSE); | |
1859 | } | |
1860 | } | |
1861 | } else { | |
1862 | return (thePlane < firstPlane || thePlane > lastPlane ? FALSE : TRUE); | |
1863 | } | |
1864 | } else { | |
1865 | if (thePlane == 0) { | |
1866 | switch (__CFCSetClassType(theSet)) { | |
1867 | case __kCFCharSetClassString: if (!__CFCSetStringLength(theSet)) return isInverted; break; | |
1868 | case __kCFCharSetClassCompactBitmap: return (__CFCSetCompactBitmapBits(theSet) ? TRUE : FALSE); break; | |
1869 | case __kCFCharSetClassBitmap: return (__CFCSetBitmapBits(theSet) ? TRUE : FALSE); break; | |
1870 | } | |
1871 | return TRUE; | |
1872 | } else { | |
1873 | CFCharacterSetRef annex = __CFCSetGetAnnexPlaneCharacterSetNoAlloc(theSet, thePlane); | |
1874 | if (annex) { | |
1875 | if (__CFCSetIsRange(annex)) { | |
1876 | return (__CFCSetAnnexIsInverted(theSet) && (__CFCSetRangeFirstChar(annex) == 0) && (__CFCSetRangeLength(annex) == 0x10000) ? FALSE : TRUE); | |
1877 | } else if (__CFCSetIsBitmap(annex)) { | |
1878 | return (__CFCSetAnnexIsInverted(theSet) && __CFCSetIsEqualBitmap((const UInt32 *)__CFCSetBitmapBits(annex), (const UInt32 *)-1) ? FALSE : TRUE); | |
1879 | } else { | |
1880 | uint8_t bitsBuf[__kCFBitmapSize]; | |
1881 | __CFCSetGetBitmap(annex, bitsBuf); | |
1882 | return (__CFCSetAnnexIsInverted(theSet) && __CFCSetIsEqualBitmap((const UInt32 *)bitsBuf, (const UInt32 *)-1) ? FALSE : TRUE); | |
1883 | } | |
1884 | } else { | |
1885 | return __CFCSetAnnexIsInverted(theSet); | |
1886 | } | |
1887 | } | |
1888 | } | |
1889 | ||
1890 | return FALSE; | |
1891 | } | |
1892 | ||
1893 | ||
1894 | CFDataRef CFCharacterSetCreateBitmapRepresentation(CFAllocatorRef alloc, CFCharacterSetRef theSet) { | |
1895 | CFMutableDataRef data; | |
1896 | int numNonBMPPlanes = 0; | |
1897 | int planeIndices[MAX_ANNEX_PLANE]; | |
1898 | int idx; | |
1899 | int length; | |
1900 | bool isAnnexInverted; | |
1901 | ||
856091c5 | 1902 | CF_OBJC_FUNCDISPATCHV(__kCFCharacterSetTypeID, CFDataRef , (NSCharacterSet *)theSet, _retainedBitmapRepresentation); |
9ce05555 A |
1903 | |
1904 | __CFGenericValidateType(theSet, __kCFCharacterSetTypeID); | |
1905 | ||
bd5b749c | 1906 | isAnnexInverted = (__CFCSetAnnexIsInverted(theSet) != 0); |
9ce05555 A |
1907 | |
1908 | if (__CFCSetHasNonBMPPlane(theSet)) { | |
1909 | for (idx = 1;idx <= MAX_ANNEX_PLANE;idx++) { | |
1910 | if (isAnnexInverted || __CFCSetGetAnnexPlaneCharacterSetNoAlloc(theSet, idx)) { | |
1911 | planeIndices[numNonBMPPlanes++] = idx; | |
1912 | } | |
1913 | } | |
1914 | } else if (__CFCSetIsBuiltin(theSet)) { | |
1915 | numNonBMPPlanes = (__CFCSetIsInverted(theSet) ? MAX_ANNEX_PLANE : CFUniCharGetNumberOfPlanes(__CFCSetBuiltinType(theSet)) - 1); | |
1916 | } else if (__CFCSetIsRange(theSet)) { | |
1917 | UInt32 firstChar = __CFCSetRangeFirstChar(theSet); | |
1918 | UInt32 lastChar = __CFCSetRangeFirstChar(theSet) + __CFCSetRangeLength(theSet) - 1; | |
1919 | int firstPlane = (firstChar >> 16); | |
1920 | int lastPlane = (lastChar >> 16); | |
bd5b749c | 1921 | bool isInverted = (__CFCSetIsInverted(theSet) != 0); |
9ce05555 A |
1922 | |
1923 | if (lastPlane > 0) { | |
1924 | if (firstPlane == 0) { | |
1925 | firstPlane = 1; | |
1926 | firstChar = 0x10000; | |
1927 | } | |
1928 | numNonBMPPlanes = (lastPlane - firstPlane) + 1; | |
1929 | if (isInverted) { | |
1930 | numNonBMPPlanes = MAX_ANNEX_PLANE - numNonBMPPlanes; | |
1931 | if (firstPlane == lastPlane) { | |
1932 | if (((firstChar & 0xFFFF) > 0) || ((lastChar & 0xFFFF) < 0xFFFF)) ++numNonBMPPlanes; | |
1933 | } else { | |
1934 | if ((firstChar & 0xFFFF) > 0) ++numNonBMPPlanes; | |
1935 | if ((lastChar & 0xFFFF) < 0xFFFF) ++numNonBMPPlanes; | |
1936 | } | |
1937 | } | |
1938 | } else if (isInverted) { | |
1939 | numNonBMPPlanes = MAX_ANNEX_PLANE; | |
1940 | } | |
1941 | } else if (isAnnexInverted) { | |
1942 | numNonBMPPlanes = MAX_ANNEX_PLANE; | |
1943 | } | |
1944 | ||
1945 | length = __kCFBitmapSize + ((__kCFBitmapSize + 1) * numNonBMPPlanes); | |
1946 | data = CFDataCreateMutable(alloc, length); | |
1947 | CFDataSetLength(data, length); | |
1948 | __CFCSetGetBitmap(theSet, CFDataGetMutableBytePtr(data)); | |
1949 | ||
1950 | if (numNonBMPPlanes > 0) { | |
bd5b749c | 1951 | uint8_t *bytes = CFDataGetMutableBytePtr(data) + __kCFBitmapSize; |
9ce05555 A |
1952 | |
1953 | if (__CFCSetHasNonBMPPlane(theSet)) { | |
1954 | CFCharacterSetRef subset; | |
1955 | ||
1956 | for (idx = 0;idx < numNonBMPPlanes;idx++) { | |
1957 | *(bytes++) = planeIndices[idx]; | |
1958 | if ((subset = __CFCSetGetAnnexPlaneCharacterSetNoAlloc(theSet, planeIndices[idx])) == NULL) { | |
1959 | __CFCSetBitmapFastFillWithValue((UInt32 *)bytes, (isAnnexInverted ? 0xFF : 0)); | |
1960 | } else { | |
1961 | __CFCSetGetBitmap(subset, bytes); | |
1962 | if (isAnnexInverted) { | |
1963 | uint32_t count = __kCFBitmapSize / sizeof(uint32_t); | |
1964 | uint32_t *bits = (uint32_t *)bytes; | |
1965 | ||
1966 | while (count-- > 0) { | |
1967 | *bits = ~(*bits); | |
1968 | ++bits; | |
1969 | } | |
1970 | } | |
1971 | } | |
1972 | bytes += __kCFBitmapSize; | |
1973 | } | |
1974 | } else if (__CFCSetIsBuiltin(theSet)) { | |
1975 | UInt8 result; | |
bd5b749c | 1976 | CFIndex delta; |
9ce05555 A |
1977 | Boolean isInverted = __CFCSetIsInverted(theSet); |
1978 | ||
1979 | for (idx = 0;idx < numNonBMPPlanes;idx++) { | |
bd5b749c | 1980 | if ((result = CFUniCharGetBitmapForPlane(__CFCSetBuiltinType(theSet), idx + 1, bytes + 1, (isInverted != 0))) == kCFUniCharBitmapEmpty) continue; |
9ce05555 A |
1981 | *(bytes++) = idx + 1; |
1982 | if (result == kCFUniCharBitmapAll) { | |
1983 | CFIndex bitmapLength = __kCFBitmapSize; | |
1984 | while (bitmapLength-- > 0) *(bytes++) = (uint8_t)0xFF; | |
1985 | } else { | |
1986 | bytes += __kCFBitmapSize; | |
1987 | } | |
1988 | } | |
bd5b749c A |
1989 | delta = bytes - (const uint8_t *)CFDataGetBytePtr(data); |
1990 | if (delta < length) CFDataSetLength(data, delta); | |
9ce05555 A |
1991 | } else if (__CFCSetIsRange(theSet)) { |
1992 | UInt32 firstChar = __CFCSetRangeFirstChar(theSet); | |
1993 | UInt32 lastChar = __CFCSetRangeFirstChar(theSet) + __CFCSetRangeLength(theSet) - 1; | |
1994 | int firstPlane = (firstChar >> 16); | |
1995 | int lastPlane = (lastChar >> 16); | |
1996 | ||
1997 | if (firstPlane == 0) { | |
1998 | firstPlane = 1; | |
1999 | firstChar = 0x10000; | |
2000 | } | |
2001 | if (__CFCSetIsInverted(theSet)) { | |
2002 | // Mask out the plane byte | |
2003 | firstChar &= 0xFFFF; | |
2004 | lastChar &= 0xFFFF; | |
2005 | ||
2006 | for (idx = 1;idx < firstPlane;idx++) { // Fill up until the first plane | |
2007 | *(bytes++) = idx; | |
2008 | __CFCSetBitmapFastFillWithValue((UInt32 *)bytes, 0xFF); | |
2009 | bytes += __kCFBitmapSize; | |
2010 | } | |
2011 | if (firstPlane == lastPlane) { | |
2012 | if ((firstChar > 0) || (lastChar < 0xFFFF)) { | |
2013 | *(bytes++) = idx; | |
2014 | __CFCSetBitmapFastFillWithValue((UInt32 *)bytes, 0xFF); | |
2015 | __CFCSetBitmapRemoveCharactersInRange(bytes, firstChar, lastChar); | |
2016 | bytes += __kCFBitmapSize; | |
2017 | } | |
2018 | } else if (firstPlane < lastPlane) { | |
2019 | if (firstChar > 0) { | |
2020 | *(bytes++) = idx; | |
2021 | __CFCSetBitmapFastFillWithValue((UInt32 *)bytes, 0); | |
2022 | __CFCSetBitmapAddCharactersInRange(bytes, 0, firstChar - 1); | |
2023 | bytes += __kCFBitmapSize; | |
2024 | } | |
2025 | if (lastChar < 0xFFFF) { | |
2026 | *(bytes++) = idx; | |
2027 | __CFCSetBitmapFastFillWithValue((UInt32 *)bytes, 0); | |
2028 | __CFCSetBitmapAddCharactersInRange(bytes, lastChar, 0xFFFF); | |
2029 | bytes += __kCFBitmapSize; | |
2030 | } | |
2031 | } | |
2032 | for (idx = lastPlane + 1;idx <= MAX_ANNEX_PLANE;idx++) { | |
2033 | *(bytes++) = idx; | |
2034 | __CFCSetBitmapFastFillWithValue((UInt32 *)bytes, 0xFF); | |
2035 | bytes += __kCFBitmapSize; | |
2036 | } | |
2037 | } else { | |
2038 | for (idx = firstPlane;idx <= lastPlane;idx++) { | |
2039 | *(bytes++) = idx; | |
2040 | __CFCSetBitmapAddCharactersInRange(bytes, (idx == firstPlane ? firstChar : 0), (idx == lastPlane ? lastChar : 0xFFFF)); | |
2041 | bytes += __kCFBitmapSize; | |
2042 | } | |
2043 | } | |
2044 | } else if (isAnnexInverted) { | |
2045 | for (idx = 1;idx <= MAX_ANNEX_PLANE;idx++) { | |
2046 | *(bytes++) = idx; | |
2047 | __CFCSetBitmapFastFillWithValue((UInt32 *)bytes, 0xFF); | |
2048 | bytes += __kCFBitmapSize; | |
2049 | } | |
2050 | } | |
2051 | } | |
2052 | ||
2053 | return data; | |
2054 | } | |
2055 | ||
2056 | /*** MutableCharacterSet functions ***/ | |
2057 | void CFCharacterSetAddCharactersInRange(CFMutableCharacterSetRef theSet, CFRange theRange) { | |
856091c5 | 2058 | CF_OBJC_FUNCDISPATCHV(__kCFCharacterSetTypeID, void, (NSMutableCharacterSet *)theSet, addCharactersInRange:NSMakeRange(theRange.location, theRange.length)); |
9ce05555 A |
2059 | |
2060 | __CFCSetValidateTypeAndMutability(theSet, __PRETTY_FUNCTION__); | |
2061 | __CFCSetValidateRange(theRange, __PRETTY_FUNCTION__); | |
2062 | ||
a48904a4 A |
2063 | if (__CFCSetIsBuiltin((CFCharacterSetRef)theSet) && !__CFCSetIsMutable((CFCharacterSetRef)theSet) && !__CFCSetIsInverted((CFCharacterSetRef)theSet)) { |
2064 | CFCharacterSetRef sharedSet = CFCharacterSetGetPredefined(__CFCSetBuiltinType((CFCharacterSetRef)theSet)); | |
2065 | if (sharedSet == theSet) { // We're trying to dealloc the builtin set | |
2066 | CFAssert1(0, __kCFLogAssertion, "%s: Trying to mutable predefined set.", __PRETTY_FUNCTION__); | |
2067 | return; // We don't mutate builtin set | |
2068 | } | |
2069 | } | |
2070 | ||
9ce05555 A |
2071 | if (!theRange.length || (__CFCSetIsInverted(theSet) && __CFCSetIsEmpty(theSet))) return; // Inverted && empty set contains all char |
2072 | ||
2073 | if (!__CFCSetIsInverted(theSet)) { | |
2074 | if (__CFCSetIsEmpty(theSet)) { | |
2075 | __CFCSetPutClassType(theSet, __kCFCharSetClassRange); | |
2076 | __CFCSetPutRangeFirstChar(theSet, theRange.location); | |
2077 | __CFCSetPutRangeLength(theSet, theRange.length); | |
2078 | __CFCSetPutHasHashValue(theSet, false); | |
2079 | return; | |
2080 | } else if (__CFCSetIsRange(theSet)) { | |
2081 | CFIndex firstChar = __CFCSetRangeFirstChar(theSet); | |
2082 | CFIndex length = __CFCSetRangeLength(theSet); | |
2083 | ||
2084 | if (firstChar == theRange.location) { | |
856091c5 | 2085 | __CFCSetPutRangeLength(theSet, __CFMax(length, theRange.length)); |
9ce05555 A |
2086 | __CFCSetPutHasHashValue(theSet, false); |
2087 | return; | |
2088 | } else if (firstChar < theRange.location && theRange.location <= firstChar + length) { | |
2089 | if (firstChar + length < theRange.location + theRange.length) __CFCSetPutRangeLength(theSet, theRange.length + (theRange.location - firstChar)); | |
2090 | __CFCSetPutHasHashValue(theSet, false); | |
2091 | return; | |
2092 | } else if (theRange.location < firstChar && firstChar <= theRange.location + theRange.length) { | |
2093 | __CFCSetPutRangeFirstChar(theSet, theRange.location); | |
2094 | __CFCSetPutRangeLength(theSet, length + (firstChar - theRange.location)); | |
2095 | __CFCSetPutHasHashValue(theSet, false); | |
2096 | return; | |
2097 | } | |
2098 | } else if (__CFCSetIsString(theSet) && __CFCSetStringLength(theSet) + theRange.length < __kCFStringCharSetMax) { | |
2099 | UniChar *buffer; | |
2100 | if (!__CFCSetStringBuffer(theSet)) | |
bd5b749c | 2101 | __CFCSetPutStringBuffer(theSet, (UniChar *)CFAllocatorAllocate(CFGetAllocator(theSet), __kCFStringCharSetMax * sizeof(UniChar), 0)); |
9ce05555 A |
2102 | buffer = __CFCSetStringBuffer(theSet) + __CFCSetStringLength(theSet); |
2103 | __CFCSetPutStringLength(theSet, __CFCSetStringLength(theSet) + theRange.length); | |
bd5b749c | 2104 | while (theRange.length--) *buffer++ = (UniChar)theRange.location++; |
9ce05555 A |
2105 | qsort(__CFCSetStringBuffer(theSet), __CFCSetStringLength(theSet), sizeof(UniChar), chcompar); |
2106 | __CFCSetPutHasHashValue(theSet, false); | |
2107 | return; | |
2108 | } | |
2109 | } | |
2110 | ||
2111 | // OK, I have to be a bitmap | |
2112 | __CFCSetMakeBitmap(theSet); | |
2113 | __CFCSetAddNonBMPPlanesInRange(theSet, theRange); | |
2114 | if (theRange.location < 0x10000) { // theRange is in BMP | |
2115 | if (theRange.location + theRange.length >= NUMCHARACTERS) theRange.length = NUMCHARACTERS - theRange.location; | |
bd5b749c | 2116 | __CFCSetBitmapAddCharactersInRange(__CFCSetBitmapBits(theSet), (UniChar)theRange.location, (UniChar)(theRange.location + theRange.length - 1)); |
9ce05555 A |
2117 | } |
2118 | __CFCSetPutHasHashValue(theSet, false); | |
2119 | ||
2120 | if (__CFCheckForExapendedSet) __CFCheckForExpandedSet(theSet); | |
2121 | } | |
2122 | ||
2123 | void CFCharacterSetRemoveCharactersInRange(CFMutableCharacterSetRef theSet, CFRange theRange) { | |
856091c5 | 2124 | CF_OBJC_FUNCDISPATCHV(__kCFCharacterSetTypeID, void, (NSMutableCharacterSet *)theSet, removeCharactersInRange:NSMakeRange(theRange.location, theRange.length)); |
9ce05555 A |
2125 | |
2126 | __CFCSetValidateTypeAndMutability(theSet, __PRETTY_FUNCTION__); | |
2127 | __CFCSetValidateRange(theRange, __PRETTY_FUNCTION__); | |
a48904a4 A |
2128 | |
2129 | if (__CFCSetIsBuiltin((CFCharacterSetRef)theSet) && !__CFCSetIsMutable((CFCharacterSetRef)theSet) && !__CFCSetIsInverted((CFCharacterSetRef)theSet)) { | |
2130 | CFCharacterSetRef sharedSet = CFCharacterSetGetPredefined(__CFCSetBuiltinType((CFCharacterSetRef)theSet)); | |
2131 | if (sharedSet == theSet) { // We're trying to dealloc the builtin set | |
2132 | CFAssert1(0, __kCFLogAssertion, "%s: Trying to mutable predefined set.", __PRETTY_FUNCTION__); | |
2133 | return; // We don't mutate builtin set | |
2134 | } | |
2135 | } | |
9ce05555 A |
2136 | |
2137 | if (!theRange.length || (!__CFCSetIsInverted(theSet) && __CFCSetIsEmpty(theSet))) return; // empty set | |
2138 | ||
2139 | if (__CFCSetIsInverted(theSet)) { | |
2140 | if (__CFCSetIsEmpty(theSet)) { | |
2141 | __CFCSetPutClassType(theSet, __kCFCharSetClassRange); | |
2142 | __CFCSetPutRangeFirstChar(theSet, theRange.location); | |
2143 | __CFCSetPutRangeLength(theSet, theRange.length); | |
2144 | __CFCSetPutHasHashValue(theSet, false); | |
2145 | return; | |
2146 | } else if (__CFCSetIsRange(theSet)) { | |
2147 | CFIndex firstChar = __CFCSetRangeFirstChar(theSet); | |
2148 | CFIndex length = __CFCSetRangeLength(theSet); | |
2149 | ||
2150 | if (firstChar == theRange.location) { | |
2151 | __CFCSetPutRangeLength(theSet, __CFMin(length, theRange.length)); | |
2152 | __CFCSetPutHasHashValue(theSet, false); | |
2153 | return; | |
2154 | } else if (firstChar < theRange.location && theRange.location <= firstChar + length) { | |
2155 | if (firstChar + length < theRange.location + theRange.length) __CFCSetPutRangeLength(theSet, theRange.length + (theRange.location - firstChar)); | |
2156 | __CFCSetPutHasHashValue(theSet, false); | |
2157 | return; | |
2158 | } else if (theRange.location < firstChar && firstChar <= theRange.location + theRange.length) { | |
2159 | __CFCSetPutRangeFirstChar(theSet, theRange.location); | |
2160 | __CFCSetPutRangeLength(theSet, length + (firstChar - theRange.location)); | |
2161 | __CFCSetPutHasHashValue(theSet, false); | |
2162 | return; | |
2163 | } | |
2164 | } else if (__CFCSetIsString(theSet) && __CFCSetStringLength(theSet) + theRange.length < __kCFStringCharSetMax) { | |
2165 | UniChar *buffer; | |
2166 | if (!__CFCSetStringBuffer(theSet)) | |
bd5b749c | 2167 | __CFCSetPutStringBuffer(theSet, (UniChar *)CFAllocatorAllocate(CFGetAllocator(theSet), __kCFStringCharSetMax * sizeof(UniChar), 0)); |
9ce05555 A |
2168 | buffer = __CFCSetStringBuffer(theSet) + __CFCSetStringLength(theSet); |
2169 | __CFCSetPutStringLength(theSet, __CFCSetStringLength(theSet) + theRange.length); | |
bd5b749c | 2170 | while (theRange.length--) *buffer++ = (UniChar)theRange.location++; |
9ce05555 A |
2171 | qsort(__CFCSetStringBuffer(theSet), __CFCSetStringLength(theSet), sizeof(UniChar), chcompar); |
2172 | __CFCSetPutHasHashValue(theSet, false); | |
2173 | return; | |
2174 | } | |
2175 | } | |
2176 | ||
2177 | // OK, I have to be a bitmap | |
2178 | __CFCSetMakeBitmap(theSet); | |
2179 | __CFCSetRemoveNonBMPPlanesInRange(theSet, theRange); | |
2180 | if (theRange.location < 0x10000) { // theRange is in BMP | |
2181 | if (theRange.location + theRange.length > NUMCHARACTERS) theRange.length = NUMCHARACTERS - theRange.location; | |
2182 | if (theRange.location == 0 && theRange.length == NUMCHARACTERS) { // Remove all | |
2183 | CFAllocatorDeallocate(CFGetAllocator(theSet), __CFCSetBitmapBits(theSet)); | |
2184 | __CFCSetPutBitmapBits(theSet, NULL); | |
2185 | } else { | |
bd5b749c | 2186 | __CFCSetBitmapRemoveCharactersInRange(__CFCSetBitmapBits(theSet), (UniChar)theRange.location, (UniChar)(theRange.location + theRange.length - 1)); |
9ce05555 A |
2187 | } |
2188 | } | |
2189 | ||
2190 | __CFCSetPutHasHashValue(theSet, false); | |
2191 | if (__CFCheckForExapendedSet) __CFCheckForExpandedSet(theSet); | |
2192 | } | |
2193 | ||
2194 | void CFCharacterSetAddCharactersInString(CFMutableCharacterSetRef theSet, CFStringRef theString) { | |
cf7d2af9 | 2195 | UniChar *buffer; |
9ce05555 | 2196 | CFIndex length; |
cf7d2af9 | 2197 | BOOL hasSurrogate = NO; |
9ce05555 | 2198 | |
856091c5 | 2199 | CF_OBJC_FUNCDISPATCHV(__kCFCharacterSetTypeID, void, (NSMutableCharacterSet *)theSet, addCharactersInString:(NSString *)theString); |
9ce05555 A |
2200 | |
2201 | __CFCSetValidateTypeAndMutability(theSet, __PRETTY_FUNCTION__); | |
a48904a4 A |
2202 | |
2203 | if (__CFCSetIsBuiltin((CFCharacterSetRef)theSet) && !__CFCSetIsMutable((CFCharacterSetRef)theSet) && !__CFCSetIsInverted((CFCharacterSetRef)theSet)) { | |
2204 | CFCharacterSetRef sharedSet = CFCharacterSetGetPredefined(__CFCSetBuiltinType((CFCharacterSetRef)theSet)); | |
2205 | if (sharedSet == theSet) { // We're trying to dealloc the builtin set | |
2206 | CFAssert1(0, __kCFLogAssertion, "%s: Trying to mutable predefined set.", __PRETTY_FUNCTION__); | |
2207 | return; // We don't mutate builtin set | |
2208 | } | |
2209 | } | |
9ce05555 A |
2210 | |
2211 | if ((__CFCSetIsEmpty(theSet) && __CFCSetIsInverted(theSet)) || !(length = CFStringGetLength(theString))) return; | |
2212 | ||
2213 | if (!__CFCSetIsInverted(theSet)) { | |
2214 | CFIndex newLength = length + (__CFCSetIsEmpty(theSet) ? 0 : (__CFCSetIsString(theSet) ? __CFCSetStringLength(theSet) : __kCFStringCharSetMax)); | |
2215 | ||
2216 | if (newLength < __kCFStringCharSetMax) { | |
cf7d2af9 A |
2217 | buffer = __CFCSetStringBuffer(theSet); |
2218 | ||
2219 | if (NULL == buffer) { | |
2220 | buffer = (UniChar *)CFAllocatorAllocate(CFGetAllocator(theSet), __kCFStringCharSetMax * sizeof(UniChar), 0); | |
2221 | } else { | |
2222 | buffer += __CFCSetStringLength(theSet); | |
2223 | } | |
9ce05555 | 2224 | |
9ce05555 | 2225 | CFStringGetCharacters(theString, CFRangeMake(0, length), (UniChar*)buffer); |
cf7d2af9 A |
2226 | |
2227 | if (length > 1) { | |
2228 | UTF16Char *characters = buffer; | |
2229 | const UTF16Char *charactersLimit = characters + length; | |
2230 | ||
2231 | while (characters < charactersLimit) { | |
2232 | if (CFStringIsSurrogateHighCharacter(*characters) || CFStringIsSurrogateLowCharacter(*characters)) { | |
2233 | memmove(characters, characters + 1, (charactersLimit - (characters + 1)) * sizeof(*characters)); | |
2234 | --charactersLimit; | |
2235 | hasSurrogate = YES; | |
2236 | } else { | |
2237 | ++characters; | |
2238 | } | |
2239 | } | |
2240 | ||
2241 | newLength -= (length - (charactersLimit - buffer)); | |
2242 | } | |
2243 | ||
2244 | if (0 == newLength) { | |
2245 | if (NULL == __CFCSetStringBuffer(theSet)) CFAllocatorDeallocate(CFGetAllocator(theSet), buffer); | |
2246 | } else { | |
2247 | if (NULL == __CFCSetStringBuffer(theSet)) { | |
2248 | __CFCSetPutClassType(theSet, __kCFCharSetClassString); | |
2249 | __CFCSetPutStringBuffer(theSet, buffer); | |
2250 | } | |
2251 | __CFCSetPutStringLength(theSet, newLength); | |
2252 | qsort(__CFCSetStringBuffer(theSet), newLength, sizeof(UniChar), chcompar); | |
2253 | } | |
9ce05555 | 2254 | __CFCSetPutHasHashValue(theSet, false); |
cf7d2af9 A |
2255 | |
2256 | if (hasSurrogate) __CFApplySurrogatesInString(theSet, theString, &CFCharacterSetAddCharactersInRange); | |
2257 | ||
9ce05555 A |
2258 | return; |
2259 | } | |
2260 | } | |
2261 | ||
2262 | // OK, I have to be a bitmap | |
2263 | __CFCSetMakeBitmap(theSet); | |
cf7d2af9 A |
2264 | CFStringInlineBuffer inlineBuffer; |
2265 | CFIndex idx; | |
2266 | ||
2267 | CFStringInitInlineBuffer(theString, &inlineBuffer, CFRangeMake(0, length)); | |
2268 | ||
2269 | for (idx = 0;idx < length;idx++) { | |
2270 | UTF16Char character = __CFStringGetCharacterFromInlineBufferQuick(&inlineBuffer, idx); | |
9ce05555 | 2271 | |
cf7d2af9 A |
2272 | if (CFStringIsSurrogateHighCharacter(character) || CFStringIsSurrogateLowCharacter(character)) { |
2273 | hasSurrogate = YES; | |
2274 | } else { | |
2275 | __CFCSetBitmapAddCharacter(__CFCSetBitmapBits(theSet), character); | |
2276 | } | |
9ce05555 | 2277 | } |
cf7d2af9 | 2278 | |
9ce05555 | 2279 | __CFCSetPutHasHashValue(theSet, false); |
cf7d2af9 | 2280 | |
9ce05555 | 2281 | if (__CFCheckForExapendedSet) __CFCheckForExpandedSet(theSet); |
cf7d2af9 A |
2282 | |
2283 | if (hasSurrogate) __CFApplySurrogatesInString(theSet, theString, &CFCharacterSetAddCharactersInRange); | |
9ce05555 A |
2284 | } |
2285 | ||
2286 | void CFCharacterSetRemoveCharactersInString(CFMutableCharacterSetRef theSet, CFStringRef theString) { | |
cf7d2af9 | 2287 | UniChar *buffer; |
9ce05555 | 2288 | CFIndex length; |
cf7d2af9 | 2289 | BOOL hasSurrogate = NO; |
9ce05555 | 2290 | |
856091c5 | 2291 | CF_OBJC_FUNCDISPATCHV(__kCFCharacterSetTypeID, void, (NSMutableCharacterSet *)theSet, removeCharactersInString:(NSString *)theString); |
9ce05555 A |
2292 | |
2293 | __CFCSetValidateTypeAndMutability(theSet, __PRETTY_FUNCTION__); | |
a48904a4 A |
2294 | |
2295 | if (__CFCSetIsBuiltin((CFCharacterSetRef)theSet) && !__CFCSetIsMutable((CFCharacterSetRef)theSet) && !__CFCSetIsInverted((CFCharacterSetRef)theSet)) { | |
2296 | CFCharacterSetRef sharedSet = CFCharacterSetGetPredefined(__CFCSetBuiltinType((CFCharacterSetRef)theSet)); | |
2297 | if (sharedSet == theSet) { // We're trying to dealloc the builtin set | |
2298 | CFAssert1(0, __kCFLogAssertion, "%s: Trying to mutable predefined set.", __PRETTY_FUNCTION__); | |
2299 | return; // We don't mutate builtin set | |
2300 | } | |
2301 | } | |
9ce05555 A |
2302 | |
2303 | if ((__CFCSetIsEmpty(theSet) && !__CFCSetIsInverted(theSet)) || !(length = CFStringGetLength(theString))) return; | |
2304 | ||
2305 | if (__CFCSetIsInverted(theSet)) { | |
2306 | CFIndex newLength = length + (__CFCSetIsEmpty(theSet) ? 0 : (__CFCSetIsString(theSet) ? __CFCSetStringLength(theSet) : __kCFStringCharSetMax)); | |
cf7d2af9 | 2307 | |
9ce05555 | 2308 | if (newLength < __kCFStringCharSetMax) { |
cf7d2af9 A |
2309 | buffer = __CFCSetStringBuffer(theSet); |
2310 | ||
2311 | if (NULL == buffer) { | |
2312 | buffer = (UniChar *)CFAllocatorAllocate(CFGetAllocator(theSet), __kCFStringCharSetMax * sizeof(UniChar), 0); | |
2313 | } else { | |
2314 | buffer += __CFCSetStringLength(theSet); | |
2315 | } | |
2316 | ||
2317 | CFStringGetCharacters(theString, CFRangeMake(0, length), (UniChar*)buffer); | |
2318 | ||
2319 | if (length > 1) { | |
2320 | UTF16Char *characters = buffer; | |
2321 | const UTF16Char *charactersLimit = characters + length; | |
2322 | ||
2323 | while (characters < charactersLimit) { | |
2324 | if (CFStringIsSurrogateHighCharacter(*characters) || CFStringIsSurrogateLowCharacter(*characters)) { | |
2325 | memmove(characters, characters + 1, charactersLimit - (characters + 1)); | |
2326 | --charactersLimit; | |
2327 | hasSurrogate = YES; | |
2328 | } | |
2329 | ++characters; | |
2330 | } | |
2331 | ||
2332 | newLength -= (length - (charactersLimit - buffer)); | |
2333 | } | |
2334 | ||
2335 | if (NULL == __CFCSetStringBuffer(theSet)) { | |
2336 | __CFCSetPutClassType(theSet, __kCFCharSetClassString); | |
2337 | __CFCSetPutStringBuffer(theSet, buffer); | |
2338 | } | |
9ce05555 | 2339 | __CFCSetPutStringLength(theSet, newLength); |
9ce05555 A |
2340 | qsort(__CFCSetStringBuffer(theSet), newLength, sizeof(UniChar), chcompar); |
2341 | __CFCSetPutHasHashValue(theSet, false); | |
cf7d2af9 A |
2342 | |
2343 | if (hasSurrogate) __CFApplySurrogatesInString(theSet, theString, &CFCharacterSetRemoveCharactersInRange); | |
2344 | ||
9ce05555 A |
2345 | return; |
2346 | } | |
2347 | } | |
2348 | ||
2349 | // OK, I have to be a bitmap | |
2350 | __CFCSetMakeBitmap(theSet); | |
cf7d2af9 A |
2351 | CFStringInlineBuffer inlineBuffer; |
2352 | CFIndex idx; | |
2353 | ||
2354 | CFStringInitInlineBuffer(theString, &inlineBuffer, CFRangeMake(0, length)); | |
2355 | ||
2356 | for (idx = 0;idx < length;idx++) { | |
2357 | UTF16Char character = __CFStringGetCharacterFromInlineBufferQuick(&inlineBuffer, idx); | |
2358 | ||
2359 | if (CFStringIsSurrogateHighCharacter(character) || CFStringIsSurrogateLowCharacter(character)) { | |
2360 | hasSurrogate = YES; | |
2361 | } else { | |
2362 | __CFCSetBitmapRemoveCharacter(__CFCSetBitmapBits(theSet), character); | |
2363 | } | |
9ce05555 | 2364 | } |
cf7d2af9 | 2365 | |
9ce05555 A |
2366 | __CFCSetPutHasHashValue(theSet, false); |
2367 | if (__CFCheckForExapendedSet) __CFCheckForExpandedSet(theSet); | |
cf7d2af9 A |
2368 | |
2369 | if (hasSurrogate) __CFApplySurrogatesInString(theSet, theString, &CFCharacterSetRemoveCharactersInRange); | |
9ce05555 A |
2370 | } |
2371 | ||
2372 | void CFCharacterSetUnion(CFMutableCharacterSetRef theSet, CFCharacterSetRef theOtherSet) { | |
2373 | CFCharacterSetRef expandedSet = NULL; | |
2374 | ||
856091c5 | 2375 | CF_OBJC_FUNCDISPATCHV(__kCFCharacterSetTypeID, void, (NSMutableCharacterSet *)theSet, formUnionWithCharacterSet:(NSCharacterSet *)theOtherSet); |
9ce05555 A |
2376 | |
2377 | __CFCSetValidateTypeAndMutability(theSet, __PRETTY_FUNCTION__); | |
a48904a4 A |
2378 | |
2379 | if (__CFCSetIsBuiltin((CFCharacterSetRef)theSet) && !__CFCSetIsMutable((CFCharacterSetRef)theSet) && !__CFCSetIsInverted((CFCharacterSetRef)theSet)) { | |
2380 | CFCharacterSetRef sharedSet = CFCharacterSetGetPredefined(__CFCSetBuiltinType((CFCharacterSetRef)theSet)); | |
2381 | if (sharedSet == theSet) { // We're trying to dealloc the builtin set | |
2382 | CFAssert1(0, __kCFLogAssertion, "%s: Trying to mutable predefined set.", __PRETTY_FUNCTION__); | |
2383 | return; // We don't mutate builtin set | |
2384 | } | |
2385 | } | |
9ce05555 A |
2386 | |
2387 | if (__CFCSetIsEmpty(theSet) && __CFCSetIsInverted(theSet)) return; // Inverted empty set contains all char | |
2388 | ||
2389 | if (!CF_IS_OBJC(__kCFCharacterSetTypeID, theOtherSet) || (expandedSet = __CFCharacterSetGetExpandedSetForNSCharacterSet(theOtherSet))) { // Really CF, we can do some trick here | |
2390 | if (expandedSet) theOtherSet = expandedSet; | |
2391 | ||
2392 | if (__CFCSetIsEmpty(theOtherSet)) { | |
2393 | if (__CFCSetIsInverted(theOtherSet)) { | |
2394 | if (__CFCSetIsString(theSet) && __CFCSetStringBuffer(theSet)) { | |
2395 | CFAllocatorDeallocate(CFGetAllocator(theSet), __CFCSetStringBuffer(theSet)); | |
2396 | } else if (__CFCSetIsBitmap(theSet) && __CFCSetBitmapBits(theSet)) { | |
2397 | CFAllocatorDeallocate(CFGetAllocator(theSet), __CFCSetBitmapBits(theSet)); | |
2398 | } else if (__CFCSetIsCompactBitmap(theSet) && __CFCSetCompactBitmapBits(theSet)) { | |
2399 | CFAllocatorDeallocate(CFGetAllocator(theSet), __CFCSetCompactBitmapBits(theSet)); | |
2400 | } | |
2401 | __CFCSetPutClassType(theSet, __kCFCharSetClassRange); | |
2402 | __CFCSetPutRangeLength(theSet, 0); | |
2403 | __CFCSetPutIsInverted(theSet, true); | |
2404 | __CFCSetPutHasHashValue(theSet, false); | |
2405 | __CFCSetDeallocateAnnexPlane(theSet); | |
9ce05555 | 2406 | } |
bd5b749c | 2407 | } else if (__CFCSetIsBuiltin(theOtherSet) && __CFCSetIsEmpty(theSet)) { // theSet can be builtin set |
9ce05555 A |
2408 | __CFCSetPutClassType(theSet, __kCFCharSetClassBuiltin); |
2409 | __CFCSetPutBuiltinType(theSet, __CFCSetBuiltinType(theOtherSet)); | |
cf7d2af9 A |
2410 | if (__CFCSetIsInverted(theOtherSet)) __CFCSetPutIsInverted(theSet, true); |
2411 | if (__CFCSetAnnexIsInverted(theOtherSet)) __CFCSetAnnexSetIsInverted(theSet, true); | |
9ce05555 | 2412 | __CFCSetPutHasHashValue(theSet, false); |
9ce05555 | 2413 | } else { |
bd5b749c A |
2414 | if (__CFCSetIsRange(theOtherSet)) { |
2415 | if (__CFCSetIsInverted(theOtherSet)) { | |
2416 | UTF32Char firstChar = __CFCSetRangeFirstChar(theOtherSet); | |
2417 | CFIndex length = __CFCSetRangeLength(theOtherSet); | |
2418 | ||
2419 | if (firstChar > 0) CFCharacterSetAddCharactersInRange(theSet, CFRangeMake(0, firstChar)); | |
2420 | firstChar += length; | |
2421 | length = 0x110000 - firstChar; | |
2422 | CFCharacterSetAddCharactersInRange(theSet, CFRangeMake(firstChar, length)); | |
2423 | } else { | |
2424 | CFCharacterSetAddCharactersInRange(theSet, CFRangeMake(__CFCSetRangeFirstChar(theOtherSet), __CFCSetRangeLength(theOtherSet))); | |
2425 | } | |
2426 | } else if (__CFCSetIsString(theOtherSet)) { | |
2427 | CFStringRef string = CFStringCreateWithCharactersNoCopy(CFGetAllocator(theSet), __CFCSetStringBuffer(theOtherSet), __CFCSetStringLength(theOtherSet), kCFAllocatorNull); | |
2428 | CFCharacterSetAddCharactersInString(theSet, string); | |
2429 | CFRelease(string); | |
9ce05555 | 2430 | } else { |
bd5b749c A |
2431 | __CFCSetMakeBitmap(theSet); |
2432 | if (__CFCSetIsBitmap(theOtherSet)) { | |
2433 | UInt32 *bitmap1 = (UInt32*)__CFCSetBitmapBits(theSet); | |
2434 | UInt32 *bitmap2 = (UInt32*)__CFCSetBitmapBits(theOtherSet); | |
2435 | CFIndex length = __kCFBitmapSize / sizeof(UInt32); | |
2436 | while (length--) *bitmap1++ |= *bitmap2++; | |
2437 | } else { | |
2438 | UInt32 *bitmap1 = (UInt32*)__CFCSetBitmapBits(theSet); | |
2439 | UInt32 *bitmap2; | |
2440 | CFIndex length = __kCFBitmapSize / sizeof(UInt32); | |
2441 | uint8_t bitmapBuffer[__kCFBitmapSize]; | |
2442 | __CFCSetGetBitmap(theOtherSet, bitmapBuffer); | |
2443 | bitmap2 = (UInt32*)bitmapBuffer; | |
2444 | while (length--) *bitmap1++ |= *bitmap2++; | |
2445 | } | |
2446 | __CFCSetPutHasHashValue(theSet, false); | |
9ce05555 | 2447 | } |
bd5b749c A |
2448 | if (__CFCSetHasNonBMPPlane(theOtherSet)) { |
2449 | CFMutableCharacterSetRef otherSetPlane; | |
2450 | int idx; | |
9ce05555 | 2451 | |
bd5b749c A |
2452 | for (idx = 1;idx <= MAX_ANNEX_PLANE;idx++) { |
2453 | if ((otherSetPlane = (CFMutableCharacterSetRef)__CFCSetGetAnnexPlaneCharacterSetNoAlloc(theOtherSet, idx))) { | |
2454 | CFCharacterSetUnion((CFMutableCharacterSetRef)__CFCSetGetAnnexPlaneCharacterSet(theSet, idx), otherSetPlane); | |
2455 | } | |
9ce05555 | 2456 | } |
cf7d2af9 A |
2457 | } else if (__CFCSetAnnexIsInverted(theOtherSet)) { |
2458 | if (__CFCSetHasNonBMPPlane(theSet)) __CFCSetDeallocateAnnexPlane(theSet); | |
2459 | __CFCSetAnnexSetIsInverted(theSet, true); | |
bd5b749c A |
2460 | } else if (__CFCSetIsBuiltin(theOtherSet)) { |
2461 | CFMutableCharacterSetRef annexPlane; | |
2462 | uint8_t bitmapBuffer[__kCFBitmapSize]; | |
2463 | uint8_t result; | |
2464 | int planeIndex; | |
2465 | Boolean isOtherAnnexPlaneInverted = __CFCSetAnnexIsInverted(theOtherSet); | |
2466 | UInt32 *bitmap1; | |
2467 | UInt32 *bitmap2; | |
2468 | CFIndex length; | |
9ce05555 | 2469 | |
bd5b749c A |
2470 | for (planeIndex = 1;planeIndex <= MAX_ANNEX_PLANE;planeIndex++) { |
2471 | result = CFUniCharGetBitmapForPlane(__CFCSetBuiltinType(theOtherSet), planeIndex, bitmapBuffer, (isOtherAnnexPlaneInverted != 0)); | |
2472 | if (result != kCFUniCharBitmapEmpty) { | |
2473 | annexPlane = (CFMutableCharacterSetRef)__CFCSetGetAnnexPlaneCharacterSet(theSet, planeIndex); | |
2474 | if (result == kCFUniCharBitmapAll) { | |
2475 | CFCharacterSetAddCharactersInRange(annexPlane, CFRangeMake(0x0000, 0x10000)); | |
2476 | } else { | |
2477 | __CFCSetMakeBitmap(annexPlane); | |
2478 | bitmap1 = (UInt32 *)__CFCSetBitmapBits(annexPlane); | |
2479 | length = __kCFBitmapSize / sizeof(UInt32); | |
2480 | bitmap2 = (UInt32*)bitmapBuffer; | |
2481 | while (length--) *bitmap1++ |= *bitmap2++; | |
2482 | } | |
9ce05555 A |
2483 | } |
2484 | } | |
2485 | } | |
2486 | } | |
2487 | if (__CFCheckForExapendedSet) __CFCheckForExpandedSet(theSet); | |
2488 | } else { // It's NSCharacterSet | |
bd5b749c | 2489 | CFDataRef bitmapRep = CFCharacterSetCreateBitmapRepresentation(kCFAllocatorSystemDefault, theOtherSet); |
9ce05555 A |
2490 | const UInt32 *bitmap2 = (bitmapRep && CFDataGetLength(bitmapRep) ? (const UInt32 *)CFDataGetBytePtr(bitmapRep) : NULL); |
2491 | if (bitmap2) { | |
2492 | UInt32 *bitmap1; | |
2493 | CFIndex length = __kCFBitmapSize / sizeof(UInt32); | |
2494 | __CFCSetMakeBitmap(theSet); | |
2495 | bitmap1 = (UInt32*)__CFCSetBitmapBits(theSet); | |
2496 | while (length--) *bitmap1++ |= *bitmap2++; | |
2497 | __CFCSetPutHasHashValue(theSet, false); | |
2498 | } | |
2499 | CFRelease(bitmapRep); | |
2500 | } | |
2501 | } | |
2502 | ||
2503 | void CFCharacterSetIntersect(CFMutableCharacterSetRef theSet, CFCharacterSetRef theOtherSet) { | |
2504 | CFCharacterSetRef expandedSet = NULL; | |
2505 | ||
856091c5 | 2506 | CF_OBJC_FUNCDISPATCHV(__kCFCharacterSetTypeID, void, (NSMutableCharacterSet *)theSet, formIntersectionWithCharacterSet:(NSCharacterSet *)theOtherSet); |
9ce05555 A |
2507 | |
2508 | __CFCSetValidateTypeAndMutability(theSet, __PRETTY_FUNCTION__); | |
a48904a4 A |
2509 | |
2510 | if (__CFCSetIsBuiltin((CFCharacterSetRef)theSet) && !__CFCSetIsMutable((CFCharacterSetRef)theSet) && !__CFCSetIsInverted((CFCharacterSetRef)theSet)) { | |
2511 | CFCharacterSetRef sharedSet = CFCharacterSetGetPredefined(__CFCSetBuiltinType((CFCharacterSetRef)theSet)); | |
2512 | if (sharedSet == theSet) { // We're trying to dealloc the builtin set | |
2513 | CFAssert1(0, __kCFLogAssertion, "%s: Trying to mutable predefined set.", __PRETTY_FUNCTION__); | |
2514 | return; // We don't mutate builtin set | |
2515 | } | |
2516 | } | |
9ce05555 A |
2517 | |
2518 | if (__CFCSetIsEmpty(theSet) && !__CFCSetIsInverted(theSet)) return; // empty set | |
2519 | ||
2520 | if (!CF_IS_OBJC(__kCFCharacterSetTypeID, theOtherSet) || (expandedSet = __CFCharacterSetGetExpandedSetForNSCharacterSet(theOtherSet))) { // Really CF, we can do some trick here | |
2521 | if (expandedSet) theOtherSet = expandedSet; | |
2522 | ||
2523 | if (__CFCSetIsEmpty(theOtherSet)) { | |
2524 | if (!__CFCSetIsInverted(theOtherSet)) { | |
2525 | if (__CFCSetIsString(theSet) && __CFCSetStringBuffer(theSet)) { | |
2526 | CFAllocatorDeallocate(CFGetAllocator(theSet), __CFCSetStringBuffer(theSet)); | |
2527 | } else if (__CFCSetIsBitmap(theSet) && __CFCSetBitmapBits(theSet)) { | |
2528 | CFAllocatorDeallocate(CFGetAllocator(theSet), __CFCSetBitmapBits(theSet)); | |
2529 | } else if (__CFCSetIsCompactBitmap(theSet) && __CFCSetCompactBitmapBits(theSet)) { | |
2530 | CFAllocatorDeallocate(CFGetAllocator(theSet), __CFCSetCompactBitmapBits(theSet)); | |
2531 | } | |
2532 | __CFCSetPutClassType(theSet, __kCFCharSetClassBitmap); | |
2533 | __CFCSetPutBitmapBits(theSet, NULL); | |
2534 | __CFCSetPutIsInverted(theSet, false); | |
2535 | theSet->_hashValue = 0; | |
2536 | __CFCSetPutHasHashValue(theSet, true); | |
2537 | __CFCSetDeallocateAnnexPlane(theSet); | |
2538 | } | |
2539 | } else if (__CFCSetIsEmpty(theSet)) { // non inverted empty set contains all character | |
2540 | __CFCSetPutClassType(theSet, __CFCSetClassType(theOtherSet)); | |
2541 | __CFCSetPutHasHashValue(theSet, __CFCSetHasHashValue(theOtherSet)); | |
2542 | __CFCSetPutIsInverted(theSet, __CFCSetIsInverted(theOtherSet)); | |
2543 | theSet->_hashValue = theOtherSet->_hashValue; | |
2544 | if (__CFCSetHasNonBMPPlane(theOtherSet)) { | |
2545 | CFMutableCharacterSetRef otherSetPlane; | |
2546 | int idx; | |
2547 | for (idx = 1;idx <= MAX_ANNEX_PLANE;idx++) { | |
2548 | if ((otherSetPlane = (CFMutableCharacterSetRef)__CFCSetGetAnnexPlaneCharacterSetNoAlloc(theOtherSet, idx))) { | |
2549 | otherSetPlane = (CFMutableCharacterSetRef)CFCharacterSetCreateMutableCopy(CFGetAllocator(theSet), otherSetPlane); | |
2550 | __CFCSetPutCharacterSetToAnnexPlane(theSet, otherSetPlane, idx); | |
2551 | CFRelease(otherSetPlane); | |
2552 | } | |
2553 | } | |
2554 | __CFCSetAnnexSetIsInverted(theSet, __CFCSetAnnexIsInverted(theOtherSet)); | |
2555 | } | |
2556 | ||
2557 | switch (__CFCSetClassType(theOtherSet)) { | |
2558 | case __kCFCharSetClassBuiltin: | |
2559 | __CFCSetPutBuiltinType(theSet, __CFCSetBuiltinType(theOtherSet)); | |
2560 | break; | |
2561 | ||
2562 | case __kCFCharSetClassRange: | |
2563 | __CFCSetPutRangeFirstChar(theSet, __CFCSetRangeFirstChar(theOtherSet)); | |
2564 | __CFCSetPutRangeLength(theSet, __CFCSetRangeLength(theOtherSet)); | |
2565 | break; | |
2566 | ||
2567 | case __kCFCharSetClassString: | |
2568 | __CFCSetPutStringLength(theSet, __CFCSetStringLength(theOtherSet)); | |
2569 | if (!__CFCSetStringBuffer(theSet)) | |
bd5b749c | 2570 | __CFCSetPutStringBuffer(theSet, (UniChar *)CFAllocatorAllocate(CFGetAllocator(theSet), __kCFStringCharSetMax * sizeof(UniChar), 0)); |
9ce05555 A |
2571 | memmove(__CFCSetStringBuffer(theSet), __CFCSetStringBuffer(theOtherSet), __CFCSetStringLength(theSet) * sizeof(UniChar)); |
2572 | break; | |
2573 | ||
2574 | case __kCFCharSetClassBitmap: | |
bd5b749c | 2575 | __CFCSetPutBitmapBits(theSet, (uint8_t *)CFAllocatorAllocate(CFGetAllocator(theSet), sizeof(uint8_t) * __kCFBitmapSize, 0)); |
9ce05555 A |
2576 | memmove(__CFCSetBitmapBits(theSet), __CFCSetBitmapBits(theOtherSet), __kCFBitmapSize); |
2577 | break; | |
2578 | ||
2579 | case __kCFCharSetClassCompactBitmap: { | |
2580 | const uint8_t *cBitmap = __CFCSetCompactBitmapBits(theOtherSet); | |
2581 | uint8_t *newBitmap; | |
2582 | uint32_t size = __CFCSetGetCompactBitmapSize(cBitmap); | |
bd5b749c | 2583 | newBitmap = (uint8_t *)CFAllocatorAllocate(CFGetAllocator(theSet), sizeof(uint8_t) * size, 0); |
9ce05555 A |
2584 | __CFCSetPutBitmapBits(theSet, newBitmap); |
2585 | memmove(newBitmap, cBitmap, size); | |
2586 | } | |
2587 | break; | |
2588 | ||
2589 | default: | |
2590 | CFAssert1(0, __kCFLogAssertion, "%s: Internal inconsistency error: unknown character set type", __PRETTY_FUNCTION__); // We should never come here | |
2591 | } | |
2592 | } else { | |
2593 | __CFCSetMakeBitmap(theSet); | |
2594 | if (__CFCSetIsBitmap(theOtherSet)) { | |
2595 | UInt32 *bitmap1 = (UInt32*)__CFCSetBitmapBits(theSet); | |
2596 | UInt32 *bitmap2 = (UInt32*)__CFCSetBitmapBits(theOtherSet); | |
2597 | CFIndex length = __kCFBitmapSize / sizeof(UInt32); | |
2598 | while (length--) *bitmap1++ &= *bitmap2++; | |
2599 | } else { | |
2600 | UInt32 *bitmap1 = (UInt32*)__CFCSetBitmapBits(theSet); | |
2601 | UInt32 *bitmap2; | |
2602 | CFIndex length = __kCFBitmapSize / sizeof(UInt32); | |
2603 | uint8_t bitmapBuffer[__kCFBitmapSize]; | |
2604 | __CFCSetGetBitmap(theOtherSet, bitmapBuffer); | |
2605 | bitmap2 = (UInt32*)bitmapBuffer; | |
2606 | while (length--) *bitmap1++ &= *bitmap2++; | |
2607 | } | |
2608 | __CFCSetPutHasHashValue(theSet, false); | |
2609 | if (__CFCSetHasNonBMPPlane(theOtherSet)) { | |
2610 | CFMutableCharacterSetRef annexPlane; | |
2611 | CFMutableCharacterSetRef otherSetPlane; | |
d7384798 | 2612 | CFMutableCharacterSetRef emptySet = CFCharacterSetCreateMutable(NULL); |
9ce05555 A |
2613 | int idx; |
2614 | for (idx = 1;idx <= MAX_ANNEX_PLANE;idx++) { | |
2615 | if ((otherSetPlane = (CFMutableCharacterSetRef)__CFCSetGetAnnexPlaneCharacterSetNoAlloc(theOtherSet, idx))) { | |
d7384798 | 2616 | if (__CFCSetAnnexIsInverted(theOtherSet)) CFCharacterSetInvert(otherSetPlane); |
9ce05555 | 2617 | annexPlane = (CFMutableCharacterSetRef)__CFCSetGetAnnexPlaneCharacterSet(theSet, idx); |
a48904a4 | 2618 | if (__CFCSetAnnexIsInverted(theSet)) CFCharacterSetInvert(annexPlane); |
9ce05555 | 2619 | CFCharacterSetIntersect(annexPlane, otherSetPlane); |
a48904a4 | 2620 | if (__CFCSetAnnexIsInverted(theSet)) CFCharacterSetInvert(annexPlane); |
d7384798 | 2621 | if (__CFCSetAnnexIsInverted(theOtherSet)) CFCharacterSetInvert(otherSetPlane); |
9ce05555 | 2622 | if (__CFCSetIsEmpty(annexPlane) && !__CFCSetIsInverted(annexPlane)) __CFCSetPutCharacterSetToAnnexPlane(theSet, NULL, idx); |
d7384798 A |
2623 | } else if ((annexPlane = (CFMutableCharacterSetRef) __CFCSetGetAnnexPlaneCharacterSetNoAlloc(theSet, idx))) { |
2624 | if (__CFCSetAnnexIsInverted(theSet)) { // if the annexPlane is inverted, we need to set the plane to empty | |
2625 | CFCharacterSetInvert(annexPlane); | |
2626 | CFCharacterSetIntersect(annexPlane, emptySet); | |
2627 | CFCharacterSetInvert(annexPlane); | |
2628 | } else { // the annexPlane is not inverted, we can clear the plane | |
2629 | __CFCSetPutCharacterSetToAnnexPlane(theSet, NULL, idx); | |
2630 | } | |
2631 | } else if ((__CFCSetGetAnnexPlaneCharacterSetNoAlloc(theSet, idx) == NULL) && __CFCSetAnnexIsInverted(theSet)) { | |
2632 | // the set has no such annex plane and the annex plane is inverted, it means the set contains everything in the annex plane | |
2633 | annexPlane = (CFMutableCharacterSetRef)__CFCSetGetAnnexPlaneCharacterSet(theSet, idx); | |
2634 | if (__CFCSetAnnexIsInverted(theSet)) CFCharacterSetInvert(annexPlane); | |
2635 | CFCharacterSetIntersect(annexPlane, emptySet); | |
2636 | if (__CFCSetAnnexIsInverted(theSet)) CFCharacterSetInvert(annexPlane); | |
9ce05555 A |
2637 | } |
2638 | } | |
d7384798 | 2639 | CFRelease(emptySet); |
9ce05555 | 2640 | if (!__CFCSetHasNonBMPPlane(theSet)) __CFCSetDeallocateAnnexPlane(theSet); |
cf7d2af9 | 2641 | } else if (__CFCSetIsBuiltin(theOtherSet) && !__CFCSetAnnexIsInverted(theOtherSet)) { |
9ce05555 A |
2642 | CFMutableCharacterSetRef annexPlane; |
2643 | uint8_t bitmapBuffer[__kCFBitmapSize]; | |
2644 | uint8_t result; | |
2645 | int planeIndex; | |
9ce05555 A |
2646 | UInt32 *bitmap1; |
2647 | UInt32 *bitmap2; | |
2648 | CFIndex length; | |
2649 | ||
2650 | for (planeIndex = 1;planeIndex <= MAX_ANNEX_PLANE;planeIndex++) { | |
2651 | annexPlane = (CFMutableCharacterSetRef)__CFCSetGetAnnexPlaneCharacterSetNoAlloc(theSet, planeIndex); | |
2652 | if (annexPlane) { | |
cf7d2af9 | 2653 | result = CFUniCharGetBitmapForPlane(__CFCSetBuiltinType(theOtherSet), planeIndex, bitmapBuffer, false); |
9ce05555 A |
2654 | if (result == kCFUniCharBitmapEmpty) { |
2655 | __CFCSetPutCharacterSetToAnnexPlane(theSet, NULL, planeIndex); | |
2656 | } else if (result == kCFUniCharBitmapFilled) { | |
2657 | Boolean isEmpty = true; | |
2658 | ||
2659 | __CFCSetMakeBitmap(annexPlane); | |
2660 | bitmap1 = (UInt32 *)__CFCSetBitmapBits(annexPlane); | |
2661 | length = __kCFBitmapSize / sizeof(UInt32); | |
2662 | bitmap2 = (UInt32*)bitmapBuffer; | |
2663 | ||
2664 | while (length--) { | |
2665 | if ((*bitmap1++ &= *bitmap2++)) isEmpty = false; | |
2666 | } | |
2667 | if (isEmpty) __CFCSetPutCharacterSetToAnnexPlane(theSet, NULL, planeIndex); | |
2668 | } | |
2669 | } | |
2670 | } | |
2671 | if (!__CFCSetHasNonBMPPlane(theSet)) __CFCSetDeallocateAnnexPlane(theSet); | |
2672 | } else if (__CFCSetIsRange(theOtherSet)) { | |
2673 | CFMutableCharacterSetRef tempOtherSet = CFCharacterSetCreateMutable(CFGetAllocator(theSet)); | |
2674 | CFMutableCharacterSetRef annexPlane; | |
2675 | CFMutableCharacterSetRef otherSetPlane; | |
d7384798 | 2676 | CFMutableCharacterSetRef emptySet = CFCharacterSetCreateMutable(NULL); |
9ce05555 A |
2677 | int idx; |
2678 | ||
2679 | __CFCSetAddNonBMPPlanesInRange(tempOtherSet, CFRangeMake(__CFCSetRangeFirstChar(theOtherSet), __CFCSetRangeLength(theOtherSet))); | |
2680 | ||
2681 | for (idx = 1;idx <= MAX_ANNEX_PLANE;idx++) { | |
2682 | if ((otherSetPlane = (CFMutableCharacterSetRef)__CFCSetGetAnnexPlaneCharacterSetNoAlloc(tempOtherSet, idx))) { | |
2683 | annexPlane = (CFMutableCharacterSetRef)__CFCSetGetAnnexPlaneCharacterSet(theSet, idx); | |
d7384798 | 2684 | if (__CFCSetAnnexIsInverted(tempOtherSet)) CFCharacterSetInvert(otherSetPlane); |
a48904a4 | 2685 | if (__CFCSetAnnexIsInverted(theSet)) CFCharacterSetInvert(annexPlane); |
9ce05555 | 2686 | CFCharacterSetIntersect(annexPlane, otherSetPlane); |
a48904a4 | 2687 | if (__CFCSetAnnexIsInverted(theSet)) CFCharacterSetInvert(annexPlane); |
d7384798 | 2688 | if (__CFCSetAnnexIsInverted(tempOtherSet)) CFCharacterSetInvert(otherSetPlane); |
9ce05555 | 2689 | if (__CFCSetIsEmpty(annexPlane) && !__CFCSetIsInverted(annexPlane)) __CFCSetPutCharacterSetToAnnexPlane(theSet, NULL, idx); |
d7384798 A |
2690 | } else if ((annexPlane = (CFMutableCharacterSetRef) __CFCSetGetAnnexPlaneCharacterSetNoAlloc(theSet, idx))) { |
2691 | if (__CFCSetAnnexIsInverted(theSet)) { | |
2692 | CFCharacterSetInvert(annexPlane); | |
2693 | CFCharacterSetIntersect(annexPlane, emptySet); | |
2694 | CFCharacterSetInvert(annexPlane); | |
2695 | } else { | |
2696 | __CFCSetPutCharacterSetToAnnexPlane(theSet, NULL, idx); | |
2697 | } | |
2698 | } else if ((__CFCSetGetAnnexPlaneCharacterSetNoAlloc(theSet, idx) == NULL) && __CFCSetAnnexIsInverted(theSet)) { | |
2699 | // the set has no such annex plane and the annex plane is inverted, it means the set contains everything in the annex plane | |
2700 | annexPlane = (CFMutableCharacterSetRef)__CFCSetGetAnnexPlaneCharacterSet(theSet, idx); | |
2701 | if (__CFCSetAnnexIsInverted(theSet)) CFCharacterSetInvert(annexPlane); | |
2702 | CFCharacterSetIntersect(annexPlane, emptySet); | |
2703 | if (__CFCSetAnnexIsInverted(theSet)) CFCharacterSetInvert(annexPlane); | |
9ce05555 A |
2704 | } |
2705 | } | |
2706 | if (!__CFCSetHasNonBMPPlane(theSet)) __CFCSetDeallocateAnnexPlane(theSet); | |
2707 | CFRelease(tempOtherSet); | |
d7384798 | 2708 | CFRelease(emptySet); |
cf7d2af9 | 2709 | } else if ((__CFCSetHasNonBMPPlane(theSet) || __CFCSetAnnexIsInverted(theSet)) && !__CFCSetAnnexIsInverted(theOtherSet)) { |
9ce05555 A |
2710 | __CFCSetDeallocateAnnexPlane(theSet); |
2711 | } | |
2712 | } | |
2713 | if (__CFCheckForExapendedSet) __CFCheckForExpandedSet(theSet); | |
2714 | } else { // It's NSCharacterSet | |
bd5b749c | 2715 | CFDataRef bitmapRep = CFCharacterSetCreateBitmapRepresentation(kCFAllocatorSystemDefault, theOtherSet); |
9ce05555 A |
2716 | const UInt32 *bitmap2 = (bitmapRep && CFDataGetLength(bitmapRep) ? (const UInt32 *)CFDataGetBytePtr(bitmapRep) : NULL); |
2717 | if (bitmap2) { | |
2718 | UInt32 *bitmap1; | |
2719 | CFIndex length = __kCFBitmapSize / sizeof(UInt32); | |
2720 | __CFCSetMakeBitmap(theSet); | |
2721 | bitmap1 = (UInt32*)__CFCSetBitmapBits(theSet); | |
2722 | while (length--) *bitmap1++ &= *bitmap2++; | |
2723 | __CFCSetPutHasHashValue(theSet, false); | |
2724 | } | |
2725 | CFRelease(bitmapRep); | |
2726 | } | |
2727 | } | |
2728 | ||
2729 | void CFCharacterSetInvert(CFMutableCharacterSetRef theSet) { | |
2730 | ||
856091c5 | 2731 | CF_OBJC_FUNCDISPATCHV(__kCFCharacterSetTypeID, void, (NSMutableCharacterSet *)theSet, invert); |
9ce05555 A |
2732 | |
2733 | __CFCSetValidateTypeAndMutability(theSet, __PRETTY_FUNCTION__); | |
a48904a4 A |
2734 | |
2735 | if (__CFCSetIsBuiltin((CFCharacterSetRef)theSet) && !__CFCSetIsMutable((CFCharacterSetRef)theSet) && !__CFCSetIsInverted((CFCharacterSetRef)theSet)) { | |
2736 | CFCharacterSetRef sharedSet = CFCharacterSetGetPredefined(__CFCSetBuiltinType((CFCharacterSetRef)theSet)); | |
2737 | if (sharedSet == theSet) { // We're trying to dealloc the builtin set | |
2738 | CFAssert1(0, __kCFLogAssertion, "%s: Trying to mutable predefined set.", __PRETTY_FUNCTION__); | |
2739 | return; // We don't mutate builtin set | |
2740 | } | |
2741 | } | |
9ce05555 A |
2742 | |
2743 | __CFCSetPutHasHashValue(theSet, false); | |
2744 | ||
2745 | if (__CFCSetClassType(theSet) == __kCFCharSetClassBitmap) { | |
2746 | CFIndex idx; | |
2747 | CFIndex count = __kCFBitmapSize / sizeof(UInt32); | |
2748 | UInt32 *bitmap = (UInt32*) __CFCSetBitmapBits(theSet); | |
2749 | ||
2750 | if (NULL == bitmap) { | |
bd5b749c | 2751 | bitmap = (UInt32 *)CFAllocatorAllocate(CFGetAllocator(theSet), __kCFBitmapSize, 0); |
9ce05555 | 2752 | __CFCSetPutBitmapBits(theSet, (uint8_t *)bitmap); |
bd5b749c | 2753 | for (idx = 0;idx < count;idx++) bitmap[idx] = ((UInt32)0xFFFFFFFF); |
9ce05555 A |
2754 | } else { |
2755 | for (idx = 0;idx < count;idx++) bitmap[idx] = ~(bitmap[idx]); | |
2756 | } | |
2757 | __CFCSetAllocateAnnexForPlane(theSet, 0); // We need to alloc annex to invert | |
2758 | } else if (__CFCSetClassType(theSet) == __kCFCharSetClassCompactBitmap) { | |
2759 | uint8_t *bitmap = __CFCSetCompactBitmapBits(theSet); | |
2760 | int idx; | |
2761 | int length = 0; | |
2762 | uint8_t value; | |
2763 | ||
2764 | for (idx = 0;idx < __kCFCompactBitmapNumPages;idx++) { | |
2765 | value = bitmap[idx]; | |
2766 | ||
2767 | if (value == 0) { | |
2768 | bitmap[idx] = UINT8_MAX; | |
2769 | } else if (value == UINT8_MAX) { | |
2770 | bitmap[idx] = 0; | |
2771 | } else { | |
2772 | length += __kCFCompactBitmapPageSize; | |
2773 | } | |
2774 | } | |
2775 | bitmap += __kCFCompactBitmapNumPages; | |
2776 | for (idx = 0;idx < length;idx++) bitmap[idx] = ~(bitmap[idx]); | |
2777 | __CFCSetAllocateAnnexForPlane(theSet, 0); // We need to alloc annex to invert | |
2778 | } else { | |
2779 | __CFCSetPutIsInverted(theSet, !__CFCSetIsInverted(theSet)); | |
2780 | } | |
2781 | __CFCSetAnnexSetIsInverted(theSet, !__CFCSetAnnexIsInverted(theSet)); | |
2782 | } | |
2783 | ||
2784 | void CFCharacterSetCompact(CFMutableCharacterSetRef theSet) { | |
2785 | if (__CFCSetIsBitmap(theSet) && __CFCSetBitmapBits(theSet)) __CFCSetMakeCompact(theSet); | |
2786 | if (__CFCSetHasNonBMPPlane(theSet)) { | |
2787 | CFMutableCharacterSetRef annex; | |
2788 | int idx; | |
2789 | ||
2790 | for (idx = 1;idx <= MAX_ANNEX_PLANE;idx++) { | |
2791 | if ((annex = (CFMutableCharacterSetRef)__CFCSetGetAnnexPlaneCharacterSetNoAlloc(theSet, idx)) && __CFCSetIsBitmap(annex) && __CFCSetBitmapBits(annex)) { | |
2792 | __CFCSetMakeCompact(annex); | |
2793 | } | |
2794 | } | |
2795 | } | |
2796 | } | |
2797 | ||
2798 | void CFCharacterSetFast(CFMutableCharacterSetRef theSet) { | |
2799 | if (__CFCSetIsCompactBitmap(theSet) && __CFCSetCompactBitmapBits(theSet)) __CFCSetMakeBitmap(theSet); | |
2800 | if (__CFCSetHasNonBMPPlane(theSet)) { | |
2801 | CFMutableCharacterSetRef annex; | |
2802 | int idx; | |
2803 | ||
2804 | for (idx = 1;idx <= MAX_ANNEX_PLANE;idx++) { | |
2805 | if ((annex = (CFMutableCharacterSetRef)__CFCSetGetAnnexPlaneCharacterSetNoAlloc(theSet, idx)) && __CFCSetIsCompactBitmap(annex) && __CFCSetCompactBitmapBits(annex)) { | |
2806 | __CFCSetMakeBitmap(annex); | |
2807 | } | |
2808 | } | |
2809 | } | |
2810 | } | |
2811 | ||
2812 | /* Keyed-coding support | |
2813 | */ | |
2814 | CFCharacterSetKeyedCodingType _CFCharacterSetGetKeyedCodingType(CFCharacterSetRef cset) { | |
cf7d2af9 A |
2815 | if (CF_IS_OBJC(__kCFCharacterSetTypeID, cset)) return kCFCharacterSetKeyedCodingTypeBitmap; |
2816 | ||
9ce05555 | 2817 | switch (__CFCSetClassType(cset)) { |
bd5b749c | 2818 | case __kCFCharSetClassBuiltin: return ((__CFCSetBuiltinType(cset) < kCFCharacterSetSymbol) ? kCFCharacterSetKeyedCodingTypeBuiltin : kCFCharacterSetKeyedCodingTypeBuiltinAndBitmap); |
9ce05555 A |
2819 | case __kCFCharSetClassRange: return kCFCharacterSetKeyedCodingTypeRange; |
2820 | ||
2821 | case __kCFCharSetClassString: // We have to check if we have non-BMP here | |
bd5b749c | 2822 | if (!__CFCSetHasNonBMPPlane(cset) && !__CFCSetAnnexIsInverted(cset)) return kCFCharacterSetKeyedCodingTypeString; // BMP only. we can archive the string |
9ce05555 A |
2823 | /* fallthrough */ |
2824 | ||
2825 | default: | |
2826 | return kCFCharacterSetKeyedCodingTypeBitmap; | |
2827 | } | |
2828 | } | |
2829 | ||
9ce05555 A |
2830 | CFCharacterSetPredefinedSet _CFCharacterSetGetKeyedCodingBuiltinType(CFCharacterSetRef cset) { return __CFCSetBuiltinType(cset); } |
2831 | CFRange _CFCharacterSetGetKeyedCodingRange(CFCharacterSetRef cset) { return CFRangeMake(__CFCSetRangeFirstChar(cset), __CFCSetRangeLength(cset)); } | |
bd5b749c | 2832 | CFStringRef _CFCharacterSetCreateKeyedCodingString(CFCharacterSetRef cset) { return CFStringCreateWithCharacters(kCFAllocatorSystemDefault, __CFCSetStringBuffer(cset), __CFCSetStringLength(cset)); } |
9ce05555 | 2833 | |
bd5b749c | 2834 | bool _CFCharacterSetIsInverted(CFCharacterSetRef cset) { return (__CFCSetIsInverted(cset) != 0); } |
9ce05555 A |
2835 | void _CFCharacterSetSetIsInverted(CFCharacterSetRef cset, bool flag) { __CFCSetPutIsInverted((CFMutableCharacterSetRef)cset, flag); } |
2836 | ||
bd5b749c A |
2837 | /* Inline buffer support |
2838 | */ | |
2839 | void CFCharacterSetInitInlineBuffer(CFCharacterSetRef cset, CFCharacterSetInlineBuffer *buffer) { | |
2840 | memset(buffer, 0, sizeof(CFCharacterSetInlineBuffer)); | |
2841 | buffer->cset = cset; | |
2842 | buffer->rangeLimit = 0x10000; | |
2843 | ||
2844 | if (CF_IS_OBJC(__kCFCharacterSetTypeID, cset)) { | |
2845 | CFCharacterSetRef expandedSet = __CFCharacterSetGetExpandedSetForNSCharacterSet(cset); | |
2846 | ||
2847 | if (NULL == expandedSet) { | |
2848 | buffer->flags = kCFCharacterSetNoBitmapAvailable; | |
2849 | buffer->rangeLimit = 0x110000; | |
9ce05555 | 2850 | |
bd5b749c A |
2851 | return; |
2852 | } else { | |
2853 | cset = expandedSet; | |
2854 | } | |
2855 | } | |
2856 | ||
2857 | switch (__CFCSetClassType(cset)) { | |
2858 | case __kCFCharSetClassBuiltin: | |
2859 | buffer->bitmap = CFUniCharGetBitmapPtrForPlane(__CFCSetBuiltinType(cset), 0); | |
2860 | buffer->rangeLimit = 0x110000; | |
2861 | if (NULL == buffer->bitmap) { | |
2862 | buffer->flags = kCFCharacterSetNoBitmapAvailable; | |
2863 | } else { | |
2864 | if (__CFCSetIsInverted(cset)) buffer->flags = kCFCharacterSetIsInverted; | |
2865 | } | |
2866 | break; | |
2867 | ||
2868 | case __kCFCharSetClassRange: | |
2869 | buffer->rangeStart = __CFCSetRangeFirstChar(cset); | |
2870 | buffer->rangeLimit = __CFCSetRangeFirstChar(cset) + __CFCSetRangeLength(cset); | |
2871 | if (__CFCSetIsInverted(cset)) buffer->flags = kCFCharacterSetIsInverted; | |
2872 | return; | |
2873 | ||
2874 | case __kCFCharSetClassString: | |
2875 | buffer->flags = kCFCharacterSetNoBitmapAvailable; | |
2876 | if (__CFCSetStringLength(cset) > 0) { | |
2877 | buffer->rangeStart = *__CFCSetStringBuffer(cset); | |
2878 | buffer->rangeLimit = *(__CFCSetStringBuffer(cset) + __CFCSetStringLength(cset) - 1) + 1; | |
2879 | ||
2880 | if (__CFCSetIsInverted(cset)) { | |
2881 | if (0 == buffer->rangeStart) { | |
2882 | buffer->rangeStart = buffer->rangeLimit; | |
2883 | buffer->rangeLimit = 0x10000; | |
2884 | } else if (0x10000 == buffer->rangeLimit) { | |
2885 | buffer->rangeLimit = buffer->rangeStart; | |
2886 | buffer->rangeStart = 0; | |
2887 | } else { | |
2888 | buffer->rangeStart = 0; | |
2889 | buffer->rangeLimit = 0x10000; | |
2890 | } | |
2891 | } | |
2892 | } | |
2893 | break; | |
2894 | ||
2895 | case __kCFCharSetClassBitmap: | |
2896 | case __kCFCharSetClassCompactBitmap: | |
2897 | buffer->bitmap = __CFCSetCompactBitmapBits(cset); | |
2898 | if (NULL == buffer->bitmap) { | |
2899 | buffer->flags = kCFCharacterSetIsCompactBitmap; | |
2900 | if (__CFCSetIsInverted(cset)) buffer->flags |= kCFCharacterSetIsInverted; | |
2901 | } else { | |
2902 | if (__kCFCharSetClassCompactBitmap == __CFCSetClassType(cset)) buffer->flags = kCFCharacterSetIsCompactBitmap; | |
2903 | } | |
2904 | break; | |
2905 | ||
2906 | default: | |
2907 | CFAssert1(0, __kCFLogAssertion, "%s: Internal inconsistency error: unknown character set type", __PRETTY_FUNCTION__); // We should never come here | |
2908 | return; | |
2909 | } | |
2910 | ||
2911 | if (__CFCSetAnnexIsInverted(cset)) { | |
2912 | buffer->rangeLimit = 0x110000; | |
2913 | } else if (__CFCSetHasNonBMPPlane(cset)) { | |
2914 | CFIndex index; | |
2915 | ||
2916 | for (index = MAX_ANNEX_PLANE;index > 0;index--) { | |
2917 | if (NULL != __CFCSetGetAnnexPlaneCharacterSetNoAlloc(cset, index)) { | |
2918 | buffer->rangeLimit = (index + 1) << 16; | |
2919 | break; | |
2920 | } | |
2921 | } | |
2922 | } | |
2923 | } |