]>
Commit | Line | Data |
---|---|---|
1 | /* | |
2 | ******************************************************************************* | |
3 | * | |
4 | * Copyright (C) 2003-2010, International Business Machines | |
5 | * Corporation and others. All Rights Reserved. | |
6 | * | |
7 | ******************************************************************************* | |
8 | * file name: usprep.h | |
9 | * encoding: US-ASCII | |
10 | * tab size: 8 (not used) | |
11 | * indentation:4 | |
12 | * | |
13 | * created on: 2003jul2 | |
14 | * created by: Ram Viswanadha | |
15 | */ | |
16 | ||
17 | #ifndef __USPREP_H__ | |
18 | #define __USPREP_H__ | |
19 | ||
20 | /** | |
21 | * \file | |
22 | * \brief C API: Implements the StringPrep algorithm. | |
23 | */ | |
24 | ||
25 | #include "unicode/utypes.h" | |
26 | #include "unicode/localpointer.h" | |
27 | ||
28 | /** | |
29 | * | |
30 | * StringPrep API implements the StringPrep framework as described by RFC 3454. | |
31 | * StringPrep prepares Unicode strings for use in network protocols. | |
32 | * Profiles of StringPrep are sets of rules and data according to which the | |
33 | * Unicode strings are prepared. Each profile contains tables which describe | |
34 | * how a code point should be treated. The tables are broadly classified into | |
35 | * <ul> | |
36 | * <li> Unassigned Table: Contains code points that are unassigned | |
37 | * in the Unicode Version supported by StringPrep. Currently | |
38 | * RFC 3454 supports Unicode 3.2. </li> | |
39 | * <li> Prohibited Table: Contains code points that are prohibited from | |
40 | * the output of the StringPrep processing function. </li> | |
41 | * <li> Mapping Table: Contains code points that are deleted from the output or case mapped. </li> | |
42 | * </ul> | |
43 | * | |
44 | * The procedure for preparing Unicode strings: | |
45 | * <ol> | |
46 | * <li> Map: For each character in the input, check if it has a mapping | |
47 | * and, if so, replace it with its mapping. </li> | |
48 | * <li> Normalize: Possibly normalize the result of step 1 using Unicode | |
49 | * normalization. </li> | |
50 | * <li> Prohibit: Check for any characters that are not allowed in the | |
51 | * output. If any are found, return an error.</li> | |
52 | * <li> Check bidi: Possibly check for right-to-left characters, and if | |
53 | * any are found, make sure that the whole string satisfies the | |
54 | * requirements for bidirectional strings. If the string does not | |
55 | * satisfy the requirements for bidirectional strings, return an | |
56 | * error. </li> | |
57 | * </ol> | |
58 | * @author Ram Viswanadha | |
59 | */ | |
60 | #if !UCONFIG_NO_IDNA | |
61 | ||
62 | #include "unicode/parseerr.h" | |
63 | ||
64 | /** | |
65 | * The StringPrep profile handle. Only forward-declared in this header; obtained from usprep_open() or usprep_openByType() and released with usprep_close(). | |
66 | * @stable ICU 2.8 | |
67 | */ | |
68 | typedef struct UStringPrepProfile UStringPrepProfile; | |
69 | ||
70 | ||
71 | /** | |
72 | * Default option: prohibit processing of unassigned code points in the input. | |
73 | * | |
74 | * @see usprep_prepare | |
75 | * @stable ICU 2.8 | |
76 | */ | |
77 | #define USPREP_DEFAULT 0x0000 | |
78 | ||
79 | /** | |
80 | * Option bit to allow processing of unassigned code points in the input. | |
81 | * | |
82 | * @see usprep_prepare | |
83 | * @stable ICU 2.8 | |
84 | */ | |
85 | #define USPREP_ALLOW_UNASSIGNED 0x0001 | |
86 | ||
87 | /** | |
88 | * Enumeration of the standard StringPrep profile types | |
89 | * supported by usprep_openByType(). | |
90 | * @see usprep_openByType | |
91 | * @stable ICU 4.2 | |
92 | */ | |
93 | typedef enum UStringPrepProfileType { | |
94 | /** | |
95 | * RFC3491 Nameprep | |
96 | * @stable ICU 4.2 | |
97 | */ | |
98 | USPREP_RFC3491_NAMEPREP, | |
99 | /** | |
100 | * RFC3530 nfs4_cs_prep | |
101 | * @stable ICU 4.2 | |
102 | */ | |
103 | USPREP_RFC3530_NFS4_CS_PREP, | |
104 | /** | |
105 | * RFC3530 nfs4_cs_prep with case-insensitive option | |
106 | * @stable ICU 4.2 | |
107 | */ | |
108 | USPREP_RFC3530_NFS4_CS_PREP_CI, | |
109 | /** | |
110 | * RFC3530 nfs4_cis_prep | |
111 | * @stable ICU 4.2 | |
112 | */ | |
113 | USPREP_RFC3530_NFS4_CIS_PREP, | |
114 | /** | |
115 | * RFC3530 nfs4_mixed_prep for prefix | |
116 | * @stable ICU 4.2 | |
117 | */ | |
118 | USPREP_RFC3530_NFS4_MIXED_PREP_PREFIX, | |
119 | /** | |
120 | * RFC3530 nfs4_mixed_prep for suffix | |
121 | * @stable ICU 4.2 | |
122 | */ | |
123 | USPREP_RFC3530_NFS4_MIXED_PREP_SUFFIX, | |
124 | /** | |
125 | * RFC3722 iSCSI | |
126 | * @stable ICU 4.2 | |
127 | */ | |
128 | USPREP_RFC3722_ISCSI, | |
129 | /** | |
130 | * RFC3920 XMPP Nodeprep | |
131 | * @stable ICU 4.2 | |
132 | */ | |
133 | USPREP_RFC3920_NODEPREP, | |
134 | /** | |
135 | * RFC3920 XMPP Resourceprep | |
136 | * @stable ICU 4.2 | |
137 | */ | |
138 | USPREP_RFC3920_RESOURCEPREP, | |
139 | /** | |
140 | * RFC4011 Policy MIB Stringprep | |
141 | * @stable ICU 4.2 | |
142 | */ | |
143 | USPREP_RFC4011_MIB, | |
144 | /** | |
145 | * RFC4013 SASLprep | |
146 | * @stable ICU 4.2 | |
147 | */ | |
148 | USPREP_RFC4013_SASLPREP, | |
149 | /** | |
150 | * RFC4505 trace | |
151 | * @stable ICU 4.2 | |
152 | */ | |
153 | USPREP_RFC4505_TRACE, | |
154 | /** | |
155 | * RFC4518 LDAP | |
156 | * @stable ICU 4.2 | |
157 | */ | |
158 | USPREP_RFC4518_LDAP, | |
159 | /** | |
160 | * RFC4518 LDAP for case ignore, numeric and stored prefix | |
161 | * matching rules | |
162 | * @stable ICU 4.2 | |
163 | */ | |
164 | USPREP_RFC4518_LDAP_CI | |
165 | } UStringPrepProfileType; | |
166 | ||
167 | /** | |
168 | * Creates a StringPrep profile from the data file. | |
169 | * | |
170 | * @param path string containing the full path pointing to the directory | |
171 | * where the profile resides, followed by the package name, | |
172 | * e.g. "/usr/resource/my_app/profiles/mydata" on a Unix system. | |
173 | * If NULL, ICU default data files will be used. | |
174 | * @param fileName name of the profile file to be opened | |
175 | * @param status ICU error code in/out parameter. Must not be NULL. | |
176 | * Must fulfill U_SUCCESS before the function call. | |
177 | * @return Pointer to UStringPrepProfile that is opened. Should be closed by | |
178 | * calling usprep_close(). | |
179 | * @see usprep_close() | |
180 | * @stable ICU 2.8 | |
181 | */ | |
182 | U_STABLE UStringPrepProfile* U_EXPORT2 | |
183 | usprep_open(const char* path, | |
184 | const char* fileName, | |
185 | UErrorCode* status); | |
186 | ||
187 | /** | |
188 | * Creates a StringPrep profile for the specified profile type. | |
189 | * | |
190 | * @param type The profile type, one of the UStringPrepProfileType constants | |
191 | * @param status ICU error code in/out parameter. Must not be NULL. | |
192 | * Must fulfill U_SUCCESS before the function call. | |
193 | * @return Pointer to UStringPrepProfile that is opened. Should be closed by | |
194 | * calling usprep_close(). | |
195 | * @see usprep_close() | |
196 | * @stable ICU 4.2 | |
197 | */ | |
198 | U_STABLE UStringPrepProfile* U_EXPORT2 | |
199 | usprep_openByType(UStringPrepProfileType type, | |
200 | UErrorCode* status); | |
201 | ||
202 | /** | |
203 | * Closes a profile that was opened with usprep_open() or usprep_openByType(). | |
204 | * @param profile The profile to close | |
205 | * @stable ICU 2.8 | |
206 | */ | |
207 | U_STABLE void U_EXPORT2 | |
208 | usprep_close(UStringPrepProfile* profile); | |
209 | ||
210 | #if U_SHOW_CPLUSPLUS_API | |
211 | ||
212 | U_NAMESPACE_BEGIN | |
213 | ||
214 | /** | |
215 | * \class LocalUStringPrepProfilePointer | |
216 | * "Smart pointer" class, closes a UStringPrepProfile via usprep_close(). | |
217 | * For most methods see the LocalPointerBase base class. | |
218 | * | |
219 | * @see LocalPointerBase | |
220 | * @see LocalPointer | |
221 | * @stable ICU 4.4 | |
222 | */ | |
223 | U_DEFINE_LOCAL_OPEN_POINTER(LocalUStringPrepProfilePointer, UStringPrepProfile, usprep_close); | |
224 | ||
225 | U_NAMESPACE_END | |
226 | ||
227 | #endif /* U_SHOW_CPLUSPLUS_API */ | |
228 | ||
229 | /** | |
230 | * Prepare the input buffer for use in applications with the given profile. This operation maps, normalizes (NFKC), | |
231 | * checks for prohibited and BiDi characters in the order defined by RFC 3454 | |
232 | * depending on the options specified in the profile. | |
233 | * | |
234 | * @param prep The profile to use | |
235 | * @param src Pointer to UChar buffer containing the string to prepare | |
236 | * @param srcLength Number of characters in the source string | |
237 | * @param dest Pointer to the destination buffer to receive the output | |
238 | * @param destCapacity The capacity of destination array | |
239 | * @param options A bit set of options: | |
240 | * | |
241 | * - USPREP_DEFAULT Prohibit processing of unassigned code points in the input | |
242 | * | |
243 | * - USPREP_ALLOW_UNASSIGNED Treat unassigned code points in the input | |
244 | * as normal Unicode code points. | |
245 | * | |
246 | * @param parseError Pointer to UParseError struct to receive information on position | |
247 | * of error if an error is encountered. Can be NULL. | |
248 | * @param status ICU in/out error code parameter. | |
249 | * U_INVALID_CHAR_FOUND if src contains | |
250 | * unmatched single surrogates. | |
251 | * U_INDEX_OUTOFBOUNDS_ERROR if src contains | |
252 | * too many code points. | |
253 | * U_BUFFER_OVERFLOW_ERROR if destCapacity is not enough | |
254 | * @return The number of UChars in the destination buffer | |
255 | * @stable ICU 2.8 | |
256 | */ | |
257 | ||
258 | U_STABLE int32_t U_EXPORT2 | |
259 | usprep_prepare( const UStringPrepProfile* prep, | |
260 | const UChar* src, int32_t srcLength, | |
261 | UChar* dest, int32_t destCapacity, | |
262 | int32_t options, | |
263 | UParseError* parseError, | |
264 | UErrorCode* status ); | |
265 | ||
266 | ||
267 | #endif /* #if !UCONFIG_NO_IDNA */ | |
268 | ||
269 | #endif |