]> git.saurik.com Git - apple/javascriptcore.git/blame - wtf/unicode/glib/UnicodeGLib.cpp
JavaScriptCore-621.1.tar.gz
[apple/javascriptcore.git] / wtf / unicode / glib / UnicodeGLib.cpp
CommitLineData
ba379fdc
A
1/*
2 * Copyright (C) 2008 Jürg Billeter <j@bitron.ch>
3 * Copyright (C) 2008 Dominik Röttsches <dominik.roettsches@access-company.com>
4 *
5 * This library is free software; you can redistribute it and/or
6 * modify it under the terms of the GNU Library General Public
7 * License as published by the Free Software Foundation; either
8 * version 2 of the License, or (at your option) any later version.
9 *
10 * This library is distributed in the hope that it will be useful,
11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
13 * Library General Public License for more details.
14 *
15 * You should have received a copy of the GNU Library General Public License
16 * along with this library; see the file COPYING.LIB. If not, write to
17 * the Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor,
18 * Boston, MA 02110-1301, USA.
19 *
20 */
21
f9bf01c6 22#include "config.h"
ba379fdc
A
23#include "UnicodeGLib.h"
24
25namespace WTF {
26namespace Unicode {
27
28UChar32 foldCase(UChar32 ch)
29{
30 GOwnPtr<GError> gerror;
31
32 GOwnPtr<char> utf8char;
33 utf8char.set(g_ucs4_to_utf8(reinterpret_cast<gunichar*>(&ch), 1, 0, 0, &gerror.outPtr()));
34 if (gerror)
35 return ch;
36
37 GOwnPtr<char> utf8caseFolded;
38 utf8caseFolded.set(g_utf8_casefold(utf8char.get(), -1));
39
40 GOwnPtr<gunichar> ucs4Result;
41 ucs4Result.set(g_utf8_to_ucs4_fast(utf8caseFolded.get(), -1, 0));
42
43 return *ucs4Result;
44}
45
46int foldCase(UChar* result, int resultLength, const UChar* src, int srcLength, bool* error)
47{
48 *error = false;
49 GOwnPtr<GError> gerror;
50
51 GOwnPtr<char> utf8src;
52 utf8src.set(g_utf16_to_utf8(src, srcLength, 0, 0, &gerror.outPtr()));
53 if (gerror) {
54 *error = true;
55 return -1;
56 }
57
58 GOwnPtr<char> utf8result;
59 utf8result.set(g_utf8_casefold(utf8src.get(), -1));
60
61 long utf16resultLength = -1;
62 GOwnPtr<UChar> utf16result;
63 utf16result.set(g_utf8_to_utf16(utf8result.get(), -1, 0, &utf16resultLength, &gerror.outPtr()));
64 if (gerror) {
65 *error = true;
66 return -1;
67 }
68
69 if (utf16resultLength > resultLength) {
70 *error = true;
71 return utf16resultLength;
72 }
73 memcpy(result, utf16result.get(), utf16resultLength * sizeof(UChar));
74
75 return utf16resultLength;
76}
77
78int toLower(UChar* result, int resultLength, const UChar* src, int srcLength, bool* error)
79{
80 *error = false;
81 GOwnPtr<GError> gerror;
82
83 GOwnPtr<char> utf8src;
84 utf8src.set(g_utf16_to_utf8(src, srcLength, 0, 0, &gerror.outPtr()));
85 if (gerror) {
86 *error = true;
87 return -1;
88 }
89
90 GOwnPtr<char> utf8result;
91 utf8result.set(g_utf8_strdown(utf8src.get(), -1));
92
93 long utf16resultLength = -1;
94 GOwnPtr<UChar> utf16result;
95 utf16result.set(g_utf8_to_utf16(utf8result.get(), -1, 0, &utf16resultLength, &gerror.outPtr()));
96 if (gerror) {
97 *error = true;
98 return -1;
99 }
100
101 if (utf16resultLength > resultLength) {
102 *error = true;
103 return utf16resultLength;
104 }
105 memcpy(result, utf16result.get(), utf16resultLength * sizeof(UChar));
106
107 return utf16resultLength;
108}
109
110int toUpper(UChar* result, int resultLength, const UChar* src, int srcLength, bool* error)
111{
112 *error = false;
113 GOwnPtr<GError> gerror;
114
115 GOwnPtr<char> utf8src;
116 utf8src.set(g_utf16_to_utf8(src, srcLength, 0, 0, &gerror.outPtr()));
117 if (gerror) {
118 *error = true;
119 return -1;
120 }
121
122 GOwnPtr<char> utf8result;
123 utf8result.set(g_utf8_strup(utf8src.get(), -1));
124
125 long utf16resultLength = -1;
126 GOwnPtr<UChar> utf16result;
127 utf16result.set(g_utf8_to_utf16(utf8result.get(), -1, 0, &utf16resultLength, &gerror.outPtr()));
128 if (gerror) {
129 *error = true;
130 return -1;
131 }
132
133 if (utf16resultLength > resultLength) {
134 *error = true;
135 return utf16resultLength;
136 }
137 memcpy(result, utf16result.get(), utf16resultLength * sizeof(UChar));
138
139 return utf16resultLength;
140}
141
142Direction direction(UChar32 c)
143{
144 PangoBidiType type = pango_bidi_type_for_unichar(c);
145 switch (type) {
146 case PANGO_BIDI_TYPE_L:
147 return LeftToRight;
148 case PANGO_BIDI_TYPE_R:
149 return RightToLeft;
150 case PANGO_BIDI_TYPE_AL:
151 return RightToLeftArabic;
152 case PANGO_BIDI_TYPE_LRE:
153 return LeftToRightEmbedding;
154 case PANGO_BIDI_TYPE_RLE:
155 return RightToLeftEmbedding;
156 case PANGO_BIDI_TYPE_LRO:
157 return LeftToRightOverride;
158 case PANGO_BIDI_TYPE_RLO:
159 return RightToLeftOverride;
160 case PANGO_BIDI_TYPE_PDF:
161 return PopDirectionalFormat;
162 case PANGO_BIDI_TYPE_EN:
163 return EuropeanNumber;
164 case PANGO_BIDI_TYPE_AN:
165 return ArabicNumber;
166 case PANGO_BIDI_TYPE_ES:
167 return EuropeanNumberSeparator;
168 case PANGO_BIDI_TYPE_ET:
169 return EuropeanNumberTerminator;
170 case PANGO_BIDI_TYPE_CS:
171 return CommonNumberSeparator;
172 case PANGO_BIDI_TYPE_NSM:
173 return NonSpacingMark;
174 case PANGO_BIDI_TYPE_BN:
175 return BoundaryNeutral;
176 case PANGO_BIDI_TYPE_B:
177 return BlockSeparator;
178 case PANGO_BIDI_TYPE_S:
179 return SegmentSeparator;
180 case PANGO_BIDI_TYPE_WS:
181 return WhiteSpaceNeutral;
182 default:
183 return OtherNeutral;
184 }
185}
186
187int umemcasecmp(const UChar* a, const UChar* b, int len)
188{
189 GOwnPtr<char> utf8a;
190 GOwnPtr<char> utf8b;
191
192 utf8a.set(g_utf16_to_utf8(a, len, 0, 0, 0));
193 utf8b.set(g_utf16_to_utf8(b, len, 0, 0, 0));
194
195 GOwnPtr<char> foldedA;
196 GOwnPtr<char> foldedB;
197
198 foldedA.set(g_utf8_casefold(utf8a.get(), -1));
199 foldedB.set(g_utf8_casefold(utf8b.get(), -1));
200
201 // FIXME: umemcasecmp needs to mimic u_memcasecmp of icu
202 // from the ICU docs:
203 // "Compare two strings case-insensitively using full case folding.
204 // his is equivalent to u_strcmp(u_strFoldCase(s1, n, options), u_strFoldCase(s2, n, options))."
205 //
206 // So it looks like we don't need the full g_utf8_collate here,
207 // but really a bitwise comparison of casefolded unicode chars (not utf-8 bytes).
208 // As there is no direct equivalent to this icu function in GLib, for now
209 // we'll use g_utf8_collate():
210
211 return g_utf8_collate(foldedA.get(), foldedB.get());
212}
213
214}
215}