]>
git.saurik.com Git - apple/javascriptcore.git/blob - wtf/unicode/qt4/UnicodeQt4.h
f65e2920fd2f57871c631ad84d97fb2290777234
2 * Copyright (C) 2006 George Staikos <staikos@kde.org>
3 * Copyright (C) 2006 Alexey Proskuryakov <ap@nypop.com>
4 * Copyright (C) 2006, 2007, 2008, 2009 Apple Inc. All rights reserved.
6 * This library is free software; you can redistribute it and/or
7 * modify it under the terms of the GNU Library General Public
8 * License as published by the Free Software Foundation; either
9 * version 2 of the License, or (at your option) any later version.
11 * This library is distributed in the hope that it will be useful,
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14 * Library General Public License for more details.
16 * You should have received a copy of the GNU Library General Public License
17 * along with this library; see the file COPYING.LIB. If not, write to
18 * the Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor,
19 * Boston, MA 02110-1301, USA.
23 #ifndef WTF_UNICODE_QT4_H
24 #define WTF_UNICODE_QT4_H
33 #if QT_VERSION >= 0x040300
35 namespace QUnicodeTables
{
38 ushort line_break_class
: 8;
40 ushort combiningClass
:8;
42 signed short digitValue
: 6; /* 5 needed */
43 ushort unicodeVersion
: 4;
44 ushort lowerCaseSpecial
: 1;
45 ushort upperCaseSpecial
: 1;
46 ushort titleCaseSpecial
: 1;
47 ushort caseFoldSpecial
: 1; /* currently unused */
48 signed short mirrorDiff
: 16;
49 signed short lowerCaseDiff
: 16;
50 signed short upperCaseDiff
: 16;
51 signed short titleCaseDiff
: 16;
52 signed short caseFoldDiff
: 16;
54 Q_CORE_EXPORT
const Properties
* QT_FASTCALL
properties(uint ucs4
);
55 Q_CORE_EXPORT
const Properties
* QT_FASTCALL
properties(ushort ucs2
);
60 // ugly hack to make UChar compatible with JSChar in API/JSStringRef.h
62 typedef wchar_t UChar
;
64 typedef uint16_t UChar
;
66 typedef uint32_t UChar32
;
68 // some defines from ICU
70 #define U16_IS_LEAD(c) (((c)&0xfffffc00)==0xd800)
71 #define U16_IS_TRAIL(c) (((c)&0xfffffc00)==0xdc00)
72 #define U16_SURROGATE_OFFSET ((0xd800<<10UL)+0xdc00-0x10000)
73 #define U16_GET_SUPPLEMENTARY(lead, trail) \
74 (((UChar32)(lead)<<10UL)+(UChar32)(trail)-U16_SURROGATE_OFFSET)
76 #define U16_LEAD(supplementary) (UChar)(((supplementary)>>10)+0xd7c0)
77 #define U16_TRAIL(supplementary) (UChar)(((supplementary)&0x3ff)|0xdc00)
79 #define U_IS_SURROGATE(c) (((c)&0xfffff800)==0xd800)
80 #define U16_IS_SINGLE(c) !U_IS_SURROGATE(c)
81 #define U16_IS_SURROGATE(c) U_IS_SURROGATE(c)
82 #define U16_IS_SURROGATE_LEAD(c) (((c)&0x400)==0)
84 #define U16_NEXT(s, i, length, c) { \
86 if(U16_IS_LEAD(c)) { \
88 if((i)<(length) && U16_IS_TRAIL(__c2=(s)[(i)])) { \
90 (c)=U16_GET_SUPPLEMENTARY((c), __c2); \
95 #define U_MASK(x) ((uint32_t)1<<(x))
101 LeftToRight
= QChar::DirL
,
102 RightToLeft
= QChar::DirR
,
103 EuropeanNumber
= QChar::DirEN
,
104 EuropeanNumberSeparator
= QChar::DirES
,
105 EuropeanNumberTerminator
= QChar::DirET
,
106 ArabicNumber
= QChar::DirAN
,
107 CommonNumberSeparator
= QChar::DirCS
,
108 BlockSeparator
= QChar::DirB
,
109 SegmentSeparator
= QChar::DirS
,
110 WhiteSpaceNeutral
= QChar::DirWS
,
111 OtherNeutral
= QChar::DirON
,
112 LeftToRightEmbedding
= QChar::DirLRE
,
113 LeftToRightOverride
= QChar::DirLRO
,
114 RightToLeftArabic
= QChar::DirAL
,
115 RightToLeftEmbedding
= QChar::DirRLE
,
116 RightToLeftOverride
= QChar::DirRLO
,
117 PopDirectionalFormat
= QChar::DirPDF
,
118 NonSpacingMark
= QChar::DirNSM
,
119 BoundaryNeutral
= QChar::DirBN
122 enum DecompositionType
{
123 DecompositionNone
= QChar::NoDecomposition
,
124 DecompositionCanonical
= QChar::Canonical
,
125 DecompositionCompat
= QChar::Compat
,
126 DecompositionCircle
= QChar::Circle
,
127 DecompositionFinal
= QChar::Final
,
128 DecompositionFont
= QChar::Font
,
129 DecompositionFraction
= QChar::Fraction
,
130 DecompositionInitial
= QChar::Initial
,
131 DecompositionIsolated
= QChar::Isolated
,
132 DecompositionMedial
= QChar::Medial
,
133 DecompositionNarrow
= QChar::Narrow
,
134 DecompositionNoBreak
= QChar::NoBreak
,
135 DecompositionSmall
= QChar::Small
,
136 DecompositionSquare
= QChar::Square
,
137 DecompositionSub
= QChar::Sub
,
138 DecompositionSuper
= QChar::Super
,
139 DecompositionVertical
= QChar::Vertical
,
140 DecompositionWide
= QChar::Wide
145 Mark_NonSpacing
= U_MASK(QChar::Mark_NonSpacing
),
146 Mark_SpacingCombining
= U_MASK(QChar::Mark_SpacingCombining
),
147 Mark_Enclosing
= U_MASK(QChar::Mark_Enclosing
),
148 Number_DecimalDigit
= U_MASK(QChar::Number_DecimalDigit
),
149 Number_Letter
= U_MASK(QChar::Number_Letter
),
150 Number_Other
= U_MASK(QChar::Number_Other
),
151 Separator_Space
= U_MASK(QChar::Separator_Space
),
152 Separator_Line
= U_MASK(QChar::Separator_Line
),
153 Separator_Paragraph
= U_MASK(QChar::Separator_Paragraph
),
154 Other_Control
= U_MASK(QChar::Other_Control
),
155 Other_Format
= U_MASK(QChar::Other_Format
),
156 Other_Surrogate
= U_MASK(QChar::Other_Surrogate
),
157 Other_PrivateUse
= U_MASK(QChar::Other_PrivateUse
),
158 Other_NotAssigned
= U_MASK(QChar::Other_NotAssigned
),
159 Letter_Uppercase
= U_MASK(QChar::Letter_Uppercase
),
160 Letter_Lowercase
= U_MASK(QChar::Letter_Lowercase
),
161 Letter_Titlecase
= U_MASK(QChar::Letter_Titlecase
),
162 Letter_Modifier
= U_MASK(QChar::Letter_Modifier
),
163 Letter_Other
= U_MASK(QChar::Letter_Other
),
164 Punctuation_Connector
= U_MASK(QChar::Punctuation_Connector
),
165 Punctuation_Dash
= U_MASK(QChar::Punctuation_Dash
),
166 Punctuation_Open
= U_MASK(QChar::Punctuation_Open
),
167 Punctuation_Close
= U_MASK(QChar::Punctuation_Close
),
168 Punctuation_InitialQuote
= U_MASK(QChar::Punctuation_InitialQuote
),
169 Punctuation_FinalQuote
= U_MASK(QChar::Punctuation_FinalQuote
),
170 Punctuation_Other
= U_MASK(QChar::Punctuation_Other
),
171 Symbol_Math
= U_MASK(QChar::Symbol_Math
),
172 Symbol_Currency
= U_MASK(QChar::Symbol_Currency
),
173 Symbol_Modifier
= U_MASK(QChar::Symbol_Modifier
),
174 Symbol_Other
= U_MASK(QChar::Symbol_Other
)
178 #if QT_VERSION >= 0x040300
180 // FIXME: handle surrogates correctly in all methods
182 inline UChar32
toLower(UChar32 ch
)
184 return QChar::toLower(ch
);
187 inline int toLower(UChar
* result
, int resultLength
, const UChar
* src
, int srcLength
, bool* error
)
189 const UChar
*e
= src
+ srcLength
;
190 const UChar
*s
= src
;
194 // this avoids one out of bounds check in the loop
195 if (s
< e
&& QChar(*s
).isLowSurrogate()) {
202 while (s
< e
&& (rindex
< uint(resultLength
) || !r
)) {
204 if (QChar(c
).isLowSurrogate() && QChar(*(s
- 1)).isHighSurrogate())
205 c
= QChar::surrogateToUcs4(*(s
- 1), c
);
206 const QUnicodeTables::Properties
*prop
= QUnicodeTables::properties(c
);
207 if (prop
->lowerCaseSpecial
) {
212 qstring
+= QChar(*(s
-1));
213 qstring
+= QChar(*s
);
215 qstring
= qstring
.toLower();
216 for (int i
= 0; i
< qstring
.length(); ++i
) {
217 if (rindex
>= uint(resultLength
)) {
218 needed
+= qstring
.length() - i
;
222 r
[rindex
] = qstring
.at(i
).unicode();
227 r
[rindex
] = *s
+ prop
->lowerCaseDiff
;
234 *error
= (needed
!= 0);
235 if (rindex
< uint(resultLength
))
237 return rindex
+ needed
;
240 inline UChar32
toUpper(UChar32 ch
)
242 return QChar::toUpper(ch
);
245 inline int toUpper(UChar
* result
, int resultLength
, const UChar
* src
, int srcLength
, bool* error
)
247 const UChar
*e
= src
+ srcLength
;
248 const UChar
*s
= src
;
252 // this avoids one out of bounds check in the loop
253 if (s
< e
&& QChar(*s
).isLowSurrogate()) {
260 while (s
< e
&& (rindex
< resultLength
|| !r
)) {
262 if (QChar(c
).isLowSurrogate() && QChar(*(s
- 1)).isHighSurrogate())
263 c
= QChar::surrogateToUcs4(*(s
- 1), c
);
264 const QUnicodeTables::Properties
*prop
= QUnicodeTables::properties(c
);
265 if (prop
->upperCaseSpecial
) {
270 qstring
+= QChar(*(s
-1));
271 qstring
+= QChar(*s
);
273 qstring
= qstring
.toUpper();
274 for (int i
= 0; i
< qstring
.length(); ++i
) {
275 if (rindex
>= resultLength
) {
276 needed
+= qstring
.length() - i
;
280 r
[rindex
] = qstring
.at(i
).unicode();
285 r
[rindex
] = *s
+ prop
->upperCaseDiff
;
292 *error
= (needed
!= 0);
293 if (rindex
< resultLength
)
295 return rindex
+ needed
;
298 inline int toTitleCase(UChar32 c
)
300 return QChar::toTitleCase(c
);
303 inline UChar32
foldCase(UChar32 c
)
305 return QChar::toCaseFolded(c
);
308 inline int foldCase(UChar
* result
, int resultLength
, const UChar
* src
, int srcLength
, bool* error
)
310 // FIXME: handle special casing. Easiest with some low level API in Qt
312 if (resultLength
< srcLength
) {
316 for (int i
= 0; i
< srcLength
; ++i
)
317 result
[i
] = QChar::toCaseFolded(ushort(src
[i
]));
321 inline bool isArabicChar(UChar32 c
)
323 return c
>= 0x0600 && c
<= 0x06FF;
326 inline bool isPrintableChar(UChar32 c
)
328 const uint test
= U_MASK(QChar::Other_Control
) |
329 U_MASK(QChar::Other_NotAssigned
);
330 return !(U_MASK(QChar::category(c
)) & test
);
333 inline bool isSeparatorSpace(UChar32 c
)
335 return QChar::category(c
) == QChar::Separator_Space
;
338 inline bool isPunct(UChar32 c
)
340 const uint test
= U_MASK(QChar::Punctuation_Connector
) |
341 U_MASK(QChar::Punctuation_Dash
) |
342 U_MASK(QChar::Punctuation_Open
) |
343 U_MASK(QChar::Punctuation_Close
) |
344 U_MASK(QChar::Punctuation_InitialQuote
) |
345 U_MASK(QChar::Punctuation_FinalQuote
) |
346 U_MASK(QChar::Punctuation_Other
);
347 return U_MASK(QChar::category(c
)) & test
;
350 inline bool isLower(UChar32 c
)
352 return QChar::category(c
) == QChar::Letter_Lowercase
;
355 inline bool hasLineBreakingPropertyComplexContext(UChar32
)
357 // FIXME: Implement this to return whether the character has line breaking property SA (Complex Context).
361 inline UChar32
mirroredChar(UChar32 c
)
363 return QChar::mirroredChar(c
);
366 inline uint8_t combiningClass(UChar32 c
)
368 return QChar::combiningClass(c
);
371 inline DecompositionType
decompositionType(UChar32 c
)
373 return (DecompositionType
)QChar::decompositionTag(c
);
376 inline int umemcasecmp(const UChar
* a
, const UChar
* b
, int len
)
378 // handle surrogates correctly
379 for (int i
= 0; i
< len
; ++i
) {
380 uint c1
= QChar::toCaseFolded(ushort(a
[i
]));
381 uint c2
= QChar::toCaseFolded(ushort(b
[i
]));
388 inline Direction
direction(UChar32 c
)
390 return (Direction
)QChar::direction(c
);
393 inline CharCategory
category(UChar32 c
)
395 return (CharCategory
) U_MASK(QChar::category(c
));
400 inline UChar32
toLower(UChar32 ch
)
404 return QChar((unsigned short)ch
).toLower().unicode();
407 inline int toLower(UChar
* result
, int resultLength
, const UChar
* src
, int srcLength
, bool* error
)
410 if (resultLength
< srcLength
) {
414 for (int i
= 0; i
< srcLength
; ++i
)
415 result
[i
] = QChar(src
[i
]).toLower().unicode();
419 inline UChar32
toUpper(UChar32 ch
)
423 return QChar((unsigned short)ch
).toUpper().unicode();
426 inline int toUpper(UChar
* result
, int resultLength
, const UChar
* src
, int srcLength
, bool* error
)
429 if (resultLength
< srcLength
) {
433 for (int i
= 0; i
< srcLength
; ++i
)
434 result
[i
] = QChar(src
[i
]).toUpper().unicode();
438 inline int toTitleCase(UChar32 c
)
442 return QChar((unsigned short)c
).toUpper().unicode();
445 inline UChar32
foldCase(UChar32 c
)
449 return QChar((unsigned short)c
).toLower().unicode();
452 inline int foldCase(UChar
* result
, int resultLength
, const UChar
* src
, int srcLength
, bool* error
)
454 return toLower(result
, resultLength
, src
, srcLength
, error
);
457 inline bool isPrintableChar(UChar32 c
)
459 return (c
& 0xffff0000) == 0 && QChar((unsigned short)c
).isPrint();
462 inline bool isArabicChar(UChar32 c
)
464 return c
>= 0x0600 && c
<= 0x06FF;
467 inline bool isSeparatorSpace(UChar32 c
)
469 return (c
& 0xffff0000) == 0 && QChar((unsigned short)c
).category() == QChar::Separator_Space
;
472 inline bool isPunct(UChar32 c
)
474 return (c
& 0xffff0000) == 0 && QChar((unsigned short)c
).isPunct();
477 inline bool isLower(UChar32 c
)
479 return (c
& 0xffff0000) == 0 && QChar((unsigned short)c
).category() == QChar::Letter_Lowercase
;
482 inline UChar32
mirroredChar(UChar32 c
)
486 return QChar(c
).mirroredChar().unicode();
489 inline uint8_t combiningClass(UChar32 c
)
493 return QChar((unsigned short)c
).combiningClass();
496 inline DecompositionType
decompositionType(UChar32 c
)
499 return DecompositionNone
;
500 return (DecompositionType
)QChar(c
).decompositionTag();
503 inline int umemcasecmp(const UChar
* a
, const UChar
* b
, int len
)
505 for (int i
= 0; i
< len
; ++i
) {
506 QChar c1
= QChar(a
[i
]).toLower();
507 QChar c2
= QChar(b
[i
]).toLower();
509 return c1
.unicode() - c2
.unicode();
514 inline Direction
direction(UChar32 c
)
518 return (Direction
)QChar(c
).direction();
521 inline CharCategory
category(UChar32 c
)
525 return (CharCategory
) U_MASK(QChar(c
).category());
532 #endif // WTF_UNICODE_QT4_H