]>
Commit | Line | Data |
---|---|---|
374ca955 A |
1 | /* |
2 | ******************************************************************************* | |
3 | * | |
73c04bcf | 4 | * Copyright (C) 2003-2005, International Business Machines |
374ca955 A |
5 | * Corporation and others. All Rights Reserved. |
6 | * | |
7 | ******************************************************************************* | |
8 | * file name: udataswp.h | |
9 | * encoding: US-ASCII | |
10 | * tab size: 8 (not used) | |
11 | * indentation:4 | |
12 | * | |
13 | * created on: 2003jun05 | |
14 | * created by: Markus W. Scherer | |
15 | * | |
16 | * Definitions for ICU data transformations for different platforms, | |
17 | * changing between big- and little-endian data and/or between | |
18 | * charset families (ASCII<->EBCDIC). | |
19 | */ | |
20 | ||
21 | #ifndef __UDATASWP_H__ | |
22 | #define __UDATASWP_H__ | |
23 | ||
24 | #include <stdarg.h> | |
25 | #include "unicode/utypes.h" | |
26 | ||
27 | /* forward declaration */ | |
28 | ||
29 | U_CDECL_BEGIN | |
30 | ||
31 | struct UDataSwapper; | |
32 | typedef struct UDataSwapper UDataSwapper; | |
33 | ||
34 | /** | |
35 | * Function type for data transformation. | |
36 | * Transforms data, or just returns the length of the data if | |
37 | * the input length is -1. | |
38 | * Swap functions assume that their data pointers are aligned properly. | |
39 | * | |
40 | * Quick implementation outline: | |
41 | * (best to copy and adapt an existing swapper implementation) | |
42 | * check that the data looks like the expected format | |
43 | * if(length<0) { | |
44 | * preflight: | |
45 | * never dereference outData | |
46 | * read inData and determine the data size | |
47 | * assume that inData is long enough for this | |
48 | * } else { | |
49 | * outData can be NULL if length==0 | |
50 | * inData==outData (in-place swapping) possible but not required! | |
51 | * verify that length>=(actual size) | |
52 | * if there is a chance that not every byte up to size is reached | |
53 | * due to padding etc.: | |
54 | * if(inData!=outData) { | |
55 | * memcpy(outData, inData, actual size); | |
56 | * } | |
57 | * swap contents | |
58 | * } | |
59 | * return actual size | |
60 | * | |
61 | * Further implementation notes: | |
62 | * - read integers from inData before swapping them | |
63 | * because in-place swapping can make them unreadable | |
64 | * - compareInvChars compares a local Unicode string with already-swapped | |
65 | * output charset strings | |
66 | * | |
67 | * @param ds Pointer to UDataSwapper containing global data about the | |
68 | * transformation and function pointers for handling primitive | |
69 | * types. | |
70 | * @param inData Pointer to the input data to be transformed or examined. | |
71 | * @param length Length of the data, counting bytes. May be -1 for preflighting. | |
72 | * If length>=0, then transform the data. | |
73 | * If length==-1, then only determine the length of the data. | |
74 | * The length cannot be determined from the data itself for all | |
75 | * types of data (e.g., not for simple arrays of integers). | |
76 | * @param outData Pointer to the output data buffer. | |
77 | * If length>=0 (transformation), then the output buffer must | |
78 | * have a capacity of at least length. | |
79 | * If length==-1, then outData will not be used and can be NULL. | |
80 | * @param pErrorCode ICU UErrorCode parameter, must not be NULL and must | |
81 | * fulfill U_SUCCESS on input. | |
82 | * @return The actual length of the data. | |
83 | * | |
84 | * @see UDataSwapper | |
73c04bcf | 85 | * @internal ICU 2.8 |
374ca955 A |
86 | */ |
87 | typedef int32_t U_CALLCONV | |
88 | UDataSwapFn(const UDataSwapper *ds, | |
89 | const void *inData, int32_t length, void *outData, | |
90 | UErrorCode *pErrorCode); | |
91 | ||
92 | /** | |
93 | * Convert one uint16_t from input to platform endianness. | |
73c04bcf | 94 | * @internal ICU 2.8 |
374ca955 A |
95 | */ |
96 | typedef uint16_t U_CALLCONV | |
97 | UDataReadUInt16(uint16_t x); | |
98 | ||
99 | /** | |
100 | * Convert one uint32_t from input to platform endianness. | |
73c04bcf | 101 | * @internal ICU 2.8 |
374ca955 A |
102 | */ |
103 | typedef uint32_t U_CALLCONV | |
104 | UDataReadUInt32(uint32_t x); | |
105 | ||
106 | /** | |
107 | * Convert one uint16_t from platform to output endianness. | |
73c04bcf | 108 | * @internal ICU 2.8 |
374ca955 A |
109 | */ |
110 | typedef void U_CALLCONV | |
111 | UDataWriteUInt16(uint16_t *p, uint16_t x); | |
112 | ||
113 | /** | |
114 | * Convert one uint32_t from platform to output endianness. | |
73c04bcf | 115 | * @internal ICU 2.8 |
374ca955 A |
116 | */ |
117 | typedef void U_CALLCONV | |
118 | UDataWriteUInt32(uint32_t *p, uint32_t x); | |
119 | ||
120 | /** | |
121 | * Compare invariant-character strings, one in the output data and the | |
122 | * other one caller-provided in Unicode. | |
123 | * An output data string is compared because strings are usually swapped | |
124 | * before the rest of the data, to allow for sorting of string tables | |
125 | * according to the output charset. | |
126 | * You can use -1 for the length parameters of NUL-terminated strings as usual. | |
127 | * Returns Unicode code point order for invariant characters. | |
73c04bcf | 128 | * @internal ICU 2.8 |
374ca955 A |
129 | */ |
130 | typedef int32_t U_CALLCONV | |
131 | UDataCompareInvChars(const UDataSwapper *ds, | |
132 | const char *outString, int32_t outLength, | |
133 | const UChar *localString, int32_t localLength); | |
134 | ||
135 | /** | |
136 | * Function for message output when an error occurs during data swapping. | |
137 | * A format string and variable number of arguments are passed | |
138 | * like for vprintf(). | |
139 | * | |
140 | * @param context A function-specific context pointer. | |
141 | * @param fmt The format string. | |
142 | * @param args The arguments for format string inserts. | |
143 | * | |
73c04bcf | 144 | * @internal ICU 2.8 |
374ca955 A |
145 | */ |
146 | typedef void U_CALLCONV | |
147 | UDataPrintError(void *context, const char *fmt, va_list args); | |
148 | ||
149 | struct UDataSwapper { | |
73c04bcf | 150 | /** Input endianness. @internal ICU 2.8 */ |
374ca955 | 151 | UBool inIsBigEndian; |
73c04bcf | 152 | /** Input charset family. @see U_CHARSET_FAMILY @internal ICU 2.8 */ |
374ca955 | 153 | uint8_t inCharset; |
73c04bcf | 154 | /** Output endianness. @internal ICU 2.8 */ |
374ca955 | 155 | UBool outIsBigEndian; |
73c04bcf | 156 | /** Output charset family. @see U_CHARSET_FAMILY @internal ICU 2.8 */ |
374ca955 A |
157 | uint8_t outCharset; |
158 | ||
159 | /* basic functions for reading data values */ | |
160 | ||
73c04bcf | 161 | /** Convert one uint16_t from input to platform endianness. @internal ICU 2.8 */ |
374ca955 | 162 | UDataReadUInt16 *readUInt16; |
73c04bcf | 163 | /** Convert one uint32_t from input to platform endianness. @internal ICU 2.8 */ |
374ca955 | 164 | UDataReadUInt32 *readUInt32; |
73c04bcf | 165 | /** Compare an invariant-character output string with a local one. @internal ICU 2.8 */ |
374ca955 A |
166 | UDataCompareInvChars *compareInvChars; |
167 | ||
168 | /* basic functions for writing data values */ | |
169 | ||
73c04bcf | 170 | /** Convert one uint16_t from platform to output endianness. @internal ICU 2.8 */ |
374ca955 | 171 | UDataWriteUInt16 *writeUInt16; |
73c04bcf | 172 | /** Convert one uint32_t from platform to output endianness. @internal ICU 2.8 */ |
374ca955 A |
173 | UDataWriteUInt32 *writeUInt32; |
174 | ||
175 | /* basic functions for data transformations */ | |
176 | ||
73c04bcf | 177 | /** Transform an array of 16-bit integers. @internal ICU 2.8 */ |
374ca955 | 178 | UDataSwapFn *swapArray16; |
73c04bcf | 179 | /** Transform an array of 32-bit integers. @internal ICU 2.8 */ |
374ca955 | 180 | UDataSwapFn *swapArray32; |
73c04bcf | 181 | /** Transform an invariant-character string. @internal ICU 2.8 */ |
374ca955 A |
182 | UDataSwapFn *swapInvChars; |
183 | ||
184 | /** | |
185 | * Function for message output when an error occurs during data swapping. | |
186 | * Can be NULL. | |
73c04bcf | 187 | * @internal ICU 2.8 |
374ca955 A |
188 | */ |
189 | UDataPrintError *printError; | |
73c04bcf | 190 | /** Context pointer for printError. @internal ICU 2.8 */ |
374ca955 A |
191 | void *printErrorContext; |
192 | }; | |
193 | ||
194 | U_CDECL_END | |
195 | ||
196 | U_CAPI UDataSwapper * U_EXPORT2 | |
197 | udata_openSwapper(UBool inIsBigEndian, uint8_t inCharset, | |
198 | UBool outIsBigEndian, uint8_t outCharset, | |
199 | UErrorCode *pErrorCode); | |
200 | ||
201 | /** | |
202 | * Open a UDataSwapper for the given input data and the specified output | |
203 | * characteristics. | |
204 | * Values of -1 for any of the characteristics mean the local platform's | |
205 | * characteristics. | |
206 | * | |
207 | * @see udata_swap | |
73c04bcf | 208 | * @internal ICU 2.8 |
374ca955 A |
209 | */ |
210 | U_CAPI UDataSwapper * U_EXPORT2 | |
211 | udata_openSwapperForInputData(const void *data, int32_t length, | |
212 | UBool outIsBigEndian, uint8_t outCharset, | |
213 | UErrorCode *pErrorCode); | |
214 | ||
215 | U_CAPI void U_EXPORT2 | |
216 | udata_closeSwapper(UDataSwapper *ds); | |
217 | ||
218 | /** | |
219 | * Read the beginning of an ICU data piece, recognize magic bytes, | |
220 | * swap the structure. | |
221 | * Set a U_UNSUPPORTED_ERROR if it does not look like an ICU data piece. | |
222 | * | |
223 | * @return The size of the data header, in bytes. | |
224 | * | |
73c04bcf | 225 | * @internal ICU 2.8 |
374ca955 A |
226 | */ |
227 | U_CAPI int32_t U_EXPORT2 | |
228 | udata_swapDataHeader(const UDataSwapper *ds, | |
229 | const void *inData, int32_t length, void *outData, | |
230 | UErrorCode *pErrorCode); | |
231 | ||
232 | /** | |
233 | * Convert one int16_t from input to platform endianness. | |
73c04bcf | 234 | * @internal ICU 2.8 |
374ca955 A |
235 | */ |
236 | U_CAPI int16_t U_EXPORT2 | |
237 | udata_readInt16(const UDataSwapper *ds, int16_t x); | |
238 | ||
239 | /** | |
240 | * Convert one int32_t from input to platform endianness. | |
73c04bcf | 241 | * @internal ICU 2.8 |
374ca955 A |
242 | */ |
243 | U_CAPI int32_t U_EXPORT2 | |
244 | udata_readInt32(const UDataSwapper *ds, int32_t x); | |
245 | ||
246 | /** | |
247 | * Swap a block of invariant, NUL-terminated strings, but not padding | |
248 | * bytes after the last string. | |
249 | * @internal | |
250 | */ | |
251 | U_CAPI int32_t U_EXPORT2 | |
252 | udata_swapInvStringBlock(const UDataSwapper *ds, | |
253 | const void *inData, int32_t length, void *outData, | |
254 | UErrorCode *pErrorCode); | |
255 | ||
256 | U_CAPI void U_EXPORT2 | |
257 | udata_printError(const UDataSwapper *ds, | |
258 | const char *fmt, | |
259 | ...); | |
260 | ||
261 | /* internal exports from putil.c -------------------------------------------- */ | |
262 | ||
263 | /* declared here to keep them out of the public putil.h */ | |
264 | ||
265 | /** | |
266 | * Swap invariant char * strings ASCII->EBCDIC. | |
267 | * @internal | |
268 | */ | |
73c04bcf | 269 | U_CAPI int32_t U_EXPORT2 |
374ca955 A |
270 | uprv_ebcdicFromAscii(const UDataSwapper *ds, |
271 | const void *inData, int32_t length, void *outData, | |
272 | UErrorCode *pErrorCode); | |
273 | ||
274 | /** | |
275 | * Copy invariant ASCII char * strings and verify they are invariant. | |
276 | * @internal | |
277 | */ | |
278 | U_CFUNC int32_t | |
279 | uprv_copyAscii(const UDataSwapper *ds, | |
280 | const void *inData, int32_t length, void *outData, | |
281 | UErrorCode *pErrorCode); | |
282 | ||
283 | /** | |
284 | * Swap invariant char * strings EBCDIC->ASCII. | |
285 | * @internal | |
286 | */ | |
287 | U_CFUNC int32_t | |
288 | uprv_asciiFromEbcdic(const UDataSwapper *ds, | |
289 | const void *inData, int32_t length, void *outData, | |
290 | UErrorCode *pErrorCode); | |
291 | ||
292 | /** | |
293 | * Copy invariant EBCDIC char * strings and verify they are invariant. | |
294 | * @internal | |
295 | */ | |
296 | U_CFUNC int32_t | |
297 | uprv_copyEbcdic(const UDataSwapper *ds, | |
298 | const void *inData, int32_t length, void *outData, | |
299 | UErrorCode *pErrorCode); | |
300 | ||
301 | /** | |
302 | * Compare ASCII invariant char * with Unicode invariant UChar * | |
303 | * @internal | |
304 | */ | |
305 | U_CFUNC int32_t | |
306 | uprv_compareInvAscii(const UDataSwapper *ds, | |
307 | const char *outString, int32_t outLength, | |
308 | const UChar *localString, int32_t localLength); | |
309 | ||
310 | /** | |
311 | * Compare EBCDIC invariant char * with Unicode invariant UChar * | |
312 | * @internal | |
313 | */ | |
314 | U_CFUNC int32_t | |
315 | uprv_compareInvEbcdic(const UDataSwapper *ds, | |
316 | const char *outString, int32_t outLength, | |
317 | const UChar *localString, int32_t localLength); | |
318 | ||
319 | /* material... -------------------------------------------------------------- */ | |
320 | ||
321 | #if 0 | |
322 | ||
323 | /* udata.h */ | |
324 | ||
325 | /** | |
326 | * Public API function in udata.c | |
327 | * | |
328 | * Same as udata_openChoice() but automatically swaps the data. | |
329 | * isAcceptable, if not NULL, may accept data with endianness and charset family | |
330 | * different from the current platform's properties. | |
331 | * If the data is acceptable and the platform properties do not match, then | |
332 | * the swap function is called to swap an allocated version of the data. | |
333 | * Preflighting may or may not be performed depending on whether the size of | |
334 | * the loaded data item is known. | |
335 | * | |
336 | * @param isAcceptable Same as for udata_openChoice(). May be NULL. | |
337 | * | |
73c04bcf | 338 | * @internal ICU 2.8 |
374ca955 A |
339 | */ |
340 | U_CAPI UDataMemory * U_EXPORT2 | |
341 | udata_openSwap(const char *path, const char *type, const char *name, | |
342 | UDataMemoryIsAcceptable *isAcceptable, void *isAcceptableContext, | |
343 | UDataSwapFn *swap, | |
344 | UDataPrintError *printError, void *printErrorContext, | |
345 | UErrorCode *pErrorCode); | |
346 | ||
347 | #endif | |
348 | ||
349 | #endif |